# Import necessary libraries
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
from torch.utils.data import DataLoader
import numpy as np
import matplotlib.pyplot as plt
# Set device (GPU if available, else CPU)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
Loading the MNIST Dataset¶
torchvision provides many built-in datasets, which are common benchmarks and can be used for learning purposes and for drafting your own neural network implementations.
Run the next cell to download the MNIST dataset and store it in the ./data folder.
train_dataset = torchvision.datasets.MNIST(root='./data', train=True, download=True)
test_dataset = torchvision.datasets.MNIST(root='./data', train=False, download=True)
Looking at the Dataset¶
The MNIST train dataset contains 60,000 (image, label) pairs.
Each image is a 28×28-pixel grayscale image of a centered handwritten digit.
Note: the test dataset contains 10,000 images with the same shape as the train data.
print(len(train_dataset))
print(train_dataset[0])
60000
(<PIL.Image.Image image mode=L size=28x28 at 0x107CC3400>, 5)
idx = 0 # Change the index to see different images
# Show some images
fig, axes = plt.subplots(1, 5, figsize=(7, 2.5))
for i in range(5):
    axes[i].imshow(train_dataset[i+idx][0], cmap='gray')
    axes[i].set_title(f"label: {train_dataset[i+idx][1]}")
    axes[i].axis('off')
Currently, the images are PIL images and the pixel values range from 0 to 255.
img = train_dataset[0][0]
print(np.max(img), np.min(img), np.shape(img))
255 0 (28, 28)
Data Preprocessing¶
In order to train a neural network on the dataset, the data needs to be pre-processed. In PyTorch and torchvision, this can be achieved with torchvision.transforms, which includes many common image-processing methods.
Note that the images in the MNIST dataset are already centered and cropped to the same shape. (For your own dataset, remember to perform these steps.)
For the MNIST dataset, we only need to perform two steps:
- Convert the PIL images with pixel values in $[0,255]$ to PyTorch tensors with values in $[0,1]$, using transforms.ToTensor()
- Normalize the images with $\mu=0.5$ and $\sigma=0.5$ (mapping $[0,1]$ to $[-1,1]$), using transforms.Normalize()
Multiple transformations can be chained using transforms.Compose.
mnist_transform = transforms.Compose([
    transforms.ToTensor(),                 # Convert PIL image to a tensor with values in [0, 1]
    transforms.Normalize((0.5,), (0.5,))   # Subtract mean 0.5 and divide by std 0.5 -> values in [-1, 1]
])
Let's define the train and test datasets again, this time with the proper transformations:
train_dataset = torchvision.datasets.MNIST(root='./data', train=True, download=True, transform=mnist_transform)
test_dataset = torchvision.datasets.MNIST(root='./data', train=False, download=True, transform=mnist_transform)
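As a quick sanity check (a minimal sketch reusing the variables defined in the cells above), we can confirm that a transformed sample is now a tensor of shape [1, 28, 28] with values in $[-1, 1]$:
# Sanity check: after the transforms, a sample is a normalized tensor, not a PIL image
sample_img, sample_label = train_dataset[0]
print(type(sample_img))                                   # <class 'torch.Tensor'>
print(sample_img.shape)                                   # torch.Size([1, 28, 28])
print(sample_img.min().item(), sample_img.max().item())   # -1.0 1.0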
We can load mini-batches of data from the dataset using DataLoader.
Setting shuffle=True causes the batches to be sampled in a random order in each epoch.
Why do we need it? $\rightarrow$ Shuffling helps prevent convergence to poor local optima and overfitting to a fixed sample order.
batchsize = 64
train_loader = DataLoader(dataset=train_dataset, batch_size=batchsize, shuffle=True)
test_loader = DataLoader(dataset=test_dataset, batch_size=batchsize, shuffle=False)
We can now look at one batch of data sampled from the DataLoader.
The input batch has shape [batch_size, channel, height, width]; here channel=1 because the images are grayscale.
images, labels = next(iter(train_loader))
print("Input batch shape: ", images.shape)
print("Output batch shape: ", labels.shape)
Input batch shape: torch.Size([64, 1, 28, 28])
Output batch shape: torch.Size([64])
Take a look at the sampled data (run the next cell several times to see different random samples).
images, labels = next(iter(train_loader))
idx = 0 # Change the index to see different images
# Show some images
fig, axes = plt.subplots(1, 5, figsize=(7, 2.5))
for i in range(5):
    axes[i].imshow(images[i+idx][0], cmap='gray')
    axes[i].set_title(f"label: {labels[i+idx].item()}")
    axes[i].axis('off')
Define the neural network structure¶
For the MNIST task, it is sufficient to use a small, fully-connected neural network.
class SimpleNN(nn.Module):
    def __init__(self, input_size=28*28, num_classes=10, hidden_size=128):
        super(SimpleNN, self).__init__()
        self.flatten = nn.Flatten()                     # [batch, 1, 28, 28] -> [batch, 784]
        self.fc1 = nn.Linear(input_size, hidden_size)   # First fully-connected layer
        self.activation = nn.ReLU()                     # Non-linear activation
        self.fc2 = nn.Linear(hidden_size, num_classes)  # Output layer (one logit per class)

    def forward(self, x):
        x = self.flatten(x)
        x = self.fc1(x)
        x = self.activation(x)
        x = self.fc2(x)
        return x
Create the NN and move it to the selected device.
model = SimpleNN().to(device)
print(model) # Look at the model architecture
SimpleNN(
  (flatten): Flatten(start_dim=1, end_dim=-1)
  (fc1): Linear(in_features=784, out_features=128, bias=True)
  (activation): ReLU()
  (fc2): Linear(in_features=128, out_features=10, bias=True)
)
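As a rough size check (a short sketch using only standard PyTorch calls), we can count the trainable parameters: fc1 contributes $784 \cdot 128 + 128$ values and fc2 contributes $128 \cdot 10 + 10$, i.e. 101,770 in total.
# Count the trainable parameters of the model
num_params = sum(p.numel() for p in model.parameters() if p.requires_grad)
print(f"Trainable parameters: {num_params}")  # expected: 101770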
Define the loss function¶
Here we are dealing with a classification problem with 10 classes (the digits 0 to 9). Which loss function should we use?
Cross-entropy Loss
For a single sample, the cross-entropy loss between the network output $y$ and the one-hot encoded label $y'$ is calculated as
$$ l_\text{Cross-Entropy}(y,y') = - \sum_{i=1}^{C} y'_{i} \log \frac{\exp(y_i)}{\sum_{c=1}^{C} \exp(y_{c})}, $$
Here,
- $i \in \{1, \dots, C\}$ are the class indices, with $C=10$.
- $y'$ is a one-hot vector, i.e. $y'_{i}=1$ if the ground truth label is class $i$, and $y'_{i}=0$ otherwise.
- $y$ is the vector of (unnormalized) outputs predicted by the neural network.
- Note 1: The factor $\exp(y_i)/\sum_c \exp(y_c)$ is the Softmax activation, which maps the unbounded network outputs to probabilities in $[0,1]$.
- Note 2: For a batched input, the loss is commonly averaged over the batch.
# Define the loss function
criterion = nn.CrossEntropyLoss()
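To connect the formula above with this PyTorch call (a minimal sketch on made-up logits and labels, not part of the original pipeline), note that nn.CrossEntropyLoss takes the raw, unnormalized network outputs and applies the log-softmax internally:
# Sketch: nn.CrossEntropyLoss vs. the manual formula, on dummy data
dummy_logits = torch.randn(4, 10)            # fake network outputs y for a batch of 4
dummy_targets = torch.tensor([3, 7, 0, 9])   # fake ground-truth class indices
manual_loss = -torch.log_softmax(dummy_logits, dim=1)[torch.arange(4), dummy_targets].mean()
print(criterion(dummy_logits, dummy_targets).item(), manual_loss.item())  # the two values should match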
Define an optimizer¶
We can choose from the common optimizers; see the torch.optim documentation:
# Feel free to change the optimizer and its hyperparameters
learning_rate = 1e-3
optimizer = optim.Adam(model.parameters(), lr=learning_rate)
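If you want to experiment, classic SGD with momentum is a common alternative (shown commented out; the learning rate below is a typical starting value for SGD, not tuned for this notebook):
# Alternative optimizer (uncomment to try): SGD with momentum
# optimizer = optim.SGD(model.parameters(), lr=0.01, momentum=0.9)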
Define the training loop¶
def train(model, train_loader, criterion, optimizer, num_epochs=10):
    model.train()  # Set the model to training mode
    for epoch in range(num_epochs):  # Loop over the dataset for multiple epochs
        for i, (images, labels) in enumerate(train_loader):  # Loop over batches in the train loader
            images, labels = images.to(device), labels.to(device)  # Move data to device (GPU if available)
            outputs = model(images)            # Forward pass
            loss = criterion(outputs, labels)  # Compute loss
            optimizer.zero_grad()              # Clear gradients from the previous step
            loss.backward()                    # Backward pass
            optimizer.step()                   # Update model parameters
            if (i+1) % 400 == 0:
                print(f'Epoch [{epoch+1}/{num_epochs}], Step [{i+1}/{len(train_loader)}], Loss: {loss.item():.4f}')
Run the cell below to start training.
train(model, train_loader, criterion, optimizer, num_epochs=10)
Epoch [1/10], Step [400/938], Loss: 0.2974
Epoch [1/10], Step [800/938], Loss: 0.4021
Epoch [2/10], Step [400/938], Loss: 0.1189
Epoch [2/10], Step [800/938], Loss: 0.1314
Epoch [3/10], Step [400/938], Loss: 0.2653
Epoch [3/10], Step [800/938], Loss: 0.1246
Epoch [4/10], Step [400/938], Loss: 0.2013
Epoch [4/10], Step [800/938], Loss: 0.0542
Epoch [5/10], Step [400/938], Loss: 0.1582
Epoch [5/10], Step [800/938], Loss: 0.1365
Epoch [6/10], Step [400/938], Loss: 0.0242
Epoch [6/10], Step [800/938], Loss: 0.0597
Epoch [7/10], Step [400/938], Loss: 0.0699
Epoch [7/10], Step [800/938], Loss: 0.0291
Epoch [8/10], Step [400/938], Loss: 0.0966
Epoch [8/10], Step [800/938], Loss: 0.0313
Epoch [9/10], Step [400/938], Loss: 0.1028
Epoch [9/10], Step [800/938], Loss: 0.0948
Epoch [10/10], Step [400/938], Loss: 0.0491
Epoch [10/10], Step [800/938], Loss: 0.0685
Evaluating the model¶
# Evaluation on the test set
model.eval()  # Set the model to evaluation mode
correct = 0
total = 0
with torch.no_grad():  # No gradients needed for evaluation
    for images, labels in test_loader:
        images, labels = images.to(device), labels.to(device)
        outputs = model(images)
        _, predicted = torch.max(outputs.data, 1)  # Predicted class = index of the largest logit
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
accuracy = correct / total
print(f"Test Accuracy: {accuracy * 100:.2f}%")
Test Accuracy: 96.73%
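Beyond the overall accuracy, it can be instructive to break the result down per digit. The snippet below is a sketch that reuses model and test_loader from above; the loop structure mirrors the evaluation cell.
# Sketch: per-class accuracy on the test set
class_correct = [0] * 10
class_total = [0] * 10
with torch.no_grad():
    for images, labels in test_loader:
        images, labels = images.to(device), labels.to(device)
        _, predicted = torch.max(model(images), 1)
        for c in range(10):
            mask = labels == c
            class_total[c] += mask.sum().item()
            class_correct[c] += (predicted[mask] == c).sum().item()
for c in range(10):
    print(f"Digit {c}: {100.0 * class_correct[c] / class_total[c]:.2f}%")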
Visualize the model predictions¶
# Redefine a loader to allow for visualization of random test images
random_test_loader = DataLoader(dataset=test_dataset, batch_size=5, shuffle=True)
images, labels = next(iter(random_test_loader))
images, labels = images.to(device), labels.to(device)
outputs = model(images)
_, predictions = torch.max(outputs, 1)
# Show some images
fig, axes = plt.subplots(1, 5, figsize=(7, 2.5))
for i in range(5):
    axes[i].imshow(images[i][0].cpu(), cmap='gray')  # Move the tensor back to the CPU for plotting
    axes[i].set_title(f"label: {labels[i].item()} \n pred: {predictions[i].item()}")
    axes[i].axis('off')
What's next¶
Change the hyperparameters of the network and of the training process, and observe what happens, for example:
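A possible starting point (a sketch with arbitrarily chosen values, reusing SimpleNN, criterion, and train from above):
# Example: wider hidden layer and smaller learning rate (values chosen arbitrarily)
model = SimpleNN(hidden_size=256).to(device)
optimizer = optim.Adam(model.parameters(), lr=5e-4)
train(model, train_loader, criterion, optimizer, num_epochs=5)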
Bonus¶
Try a different network structure. Which one would you use?
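A natural candidate for image data is a small convolutional network. The sketch below is one possible choice (the architecture and its layer sizes are assumptions, not the course solution); it can be trained with the same loss, optimizer, and training loop as above.
class SimpleCNN(nn.Module):
    def __init__(self, num_classes=10):
        super(SimpleCNN, self).__init__()
        self.conv1 = nn.Conv2d(1, 16, kernel_size=3, padding=1)   # [batch, 1, 28, 28] -> [batch, 16, 28, 28]
        self.conv2 = nn.Conv2d(16, 32, kernel_size=3, padding=1)  # [batch, 16, 14, 14] -> [batch, 32, 14, 14]
        self.pool = nn.MaxPool2d(2)                               # Halves height and width
        self.activation = nn.ReLU()
        self.fc = nn.Linear(32 * 7 * 7, num_classes)

    def forward(self, x):
        x = self.pool(self.activation(self.conv1(x)))  # -> [batch, 16, 14, 14]
        x = self.pool(self.activation(self.conv2(x)))  # -> [batch, 32, 7, 7]
        x = x.flatten(start_dim=1)                     # -> [batch, 32*7*7]
        return self.fc(x)

# Train it with the same pipeline, for example:
# model = SimpleCNN().to(device)
# optimizer = optim.Adam(model.parameters(), lr=learning_rate)
# train(model, train_loader, criterion, optimizer, num_epochs=10)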