diff --git a/computer_vision/mnist_classifier.py b/computer_vision/mnist_classifier.py
new file mode 100644
index 000000000000..dcc7efb1e1f8
--- /dev/null
+++ b/computer_vision/mnist_classifier.py
@@ -0,0 +1,167 @@
+"""
+This program is an MNIST classifier using an AlexNet-style network.
+
+For example, to train and test on the MNIST digits 1 and 2 with 4 training
+epochs, the command line input should be:
+python mnist_classifier.py 1 2 4
+"""
+
+import sys
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import torch.optim as optim
+import torchvision.datasets as dset
+import torchvision.transforms as transforms
+
+
+class AlexNet(nn.Module):
+    def __init__(self, num_classes: int = 10) -> None:
+        super().__init__()
+        # Feature extractor: stacked convolutions with ReLU activations and pooling.
+        self.feature = nn.Sequential(
+            nn.Conv2d(1, 32, kernel_size=5, stride=1, padding=1),
+            nn.ReLU(inplace=True),
+            nn.Conv2d(32, 64, kernel_size=3, padding=1),
+            nn.ReLU(inplace=True),
+            nn.MaxPool2d(kernel_size=2, stride=2),
+            nn.Conv2d(64, 96, kernel_size=3, padding=1),
+            nn.ReLU(inplace=True),
+            nn.Conv2d(96, 64, kernel_size=3, padding=1),
+            nn.ReLU(inplace=True),
+            nn.Conv2d(64, 32, kernel_size=3, padding=1),
+            nn.ReLU(inplace=True),
+            nn.MaxPool2d(kernel_size=2, stride=1),
+        )
+
+        # Classifier: fully connected layers with dropout.
+        self.classifier = nn.Sequential(
+            nn.Dropout(),
+            nn.Linear(32 * 12 * 12, 2048),
+            nn.ReLU(inplace=True),
+            nn.Dropout(),
+            nn.Linear(2048, 1024),
+            nn.ReLU(inplace=True),
+            nn.Linear(1024, num_classes),
+        )
+
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        # Run the feature extractor, flatten, then classify.
+        x = self.feature(x)
+        x = x.view(x.size(0), -1)
+        x = self.classifier(x)
+        return x
+
+
+def load_subset(full_train_set, full_test_set, label_one, label_two):
+    # Keep only the samples whose labels match the two requested digits,
+    # limited to the first 20000 training and 1000 test samples.
+    train_set = []
+    data_lim = 20000
+    for data in full_train_set:
+        if data_lim > 0:
+            data_lim -= 1
+            if data[1] == label_one or data[1] == label_two:
+                train_set.append(data)
+        else:
+            break
+
+    test_set = []
+    data_lim = 1000
+    for data in full_test_set:
+        if data_lim > 0:
+            data_lim -= 1
+            if data[1] == label_one or data[1] == label_two:
+                test_set.append(data)
+        else:
+            break
+
+    return train_set, test_set
+
+
+def train(model, optimizer, train_loader, epoch):
+    model.train()
+    for data, target in train_loader:
+        if torch.cuda.is_available():
+            data, target = data.cuda(), target.cuda()
+        optimizer.zero_grad()
+        output = model(data)
+        loss = F.cross_entropy(output, target)
+        loss.backward()
+        optimizer.step()
+
+
+def test(model, test_loader):
+    model.eval()
+    test_loss = 0.0
+    correct = 0
+    with torch.no_grad():
+        for data, target in test_loader:
+            if torch.cuda.is_available():
+                data, target = data.cuda(), target.cuda()
+            output = model(data)
+            # Sum up the batch loss.
+            test_loss += F.cross_entropy(output, target, reduction="sum").item()
+            # Get the index of the max log-probability.
+            pred = output.data.max(1, keepdim=True)[1]
+            correct += pred.eq(target.data.view_as(pred)).long().cpu().sum()
+
+    test_loss /= len(test_loader.dataset)
+    test_accuracy = 100.0 * correct.item() / len(test_loader.dataset)
+    return test_accuracy
+
+
+if __name__ == "__main__":
+    if len(sys.argv) != 4:
+        print("Usage: python mnist_classifier.py <label_one> <label_two> <epochs>")
+        sys.exit(1)
+
+    input_data_one = sys.argv[1].strip()
+    input_data_two = sys.argv[2].strip()
+    epochs = sys.argv[3].strip()
+
+    # Perform the computation only when all arguments are valid digits.
+    if input_data_one.isdigit() and input_data_two.isdigit() and epochs.isdigit():
+        label_one = int(input_data_one)
+        label_two = int(input_data_two)
+        epochs = int(epochs)
+
+        if label_one != label_two and 0 <= label_one <= 9 and 0 <= label_two <= 9:
+            torch.manual_seed(42)
+            # Load the MNIST dataset.
+            trans = transforms.Compose(
+                [transforms.ToTensor(), transforms.Normalize((0.5,), (1.0,))]
+            )
+            full_train_set = dset.MNIST(
+                root="./data", train=True, transform=trans, download=True
+            )
+            full_test_set = dset.MNIST(root="./data", train=False, transform=trans)
+            batch_size = 16
+            # Get the final train and test sets.
+            train_set, test_set = load_subset(
+                full_train_set, full_test_set, label_one, label_two
+            )
+
+            train_loader = torch.utils.data.DataLoader(
+                dataset=train_set, batch_size=batch_size, shuffle=False
+            )
+            test_loader = torch.utils.data.DataLoader(
+                dataset=test_set, batch_size=batch_size, shuffle=False
+            )
+
+            model = AlexNet()
+            if torch.cuda.is_available():
+                model.cuda()
+
+            optimizer = optim.SGD(model.parameters(), lr=0.01)
+
+            for epoch in range(1, epochs + 1):
+                train(model, optimizer, train_loader, epoch)
+                accuracy = test(model, test_loader)
+
+            print(round(accuracy, 2))
+        else:
+            print("Invalid input")
+    else:
+        print("Invalid input")