Lab 8 (part 2) - Convolutional Neural Networks¶

This lab covers the construction, fitting, and evaluation of convolutional neural networks (CNNs) using torch. You should begin by loading the following libraries:

In [1]:
import torch
import torchvision
import numpy as np

Part 1 - Convolutional Layers¶

Convolutional neural networks can be viewed as an extension of the basic network architectures discussed in our previous lab involving hidden layers that perform new types of operations. The most important of these are convolutional layers, which we will implement using the Conv2d building block in torch.

The example below demonstrates the four essential arguments of Conv2d on a randomly generated tensor whose dimensions can be taken to reflect a single 7x7 image with 3 color channels:

In [2]:
## Create random tensor to represent a 7x7 image with 3 channels
random_tensor = torch.rand(1,3,7,7)

## Use random_tensor as input into Conv2d
from torch import nn
trial_net = nn.Conv2d(in_channels=3, out_channels=4, kernel_size=3, stride=1)
trial_output = trial_net(random_tensor)

## Check output shape
print(trial_output.shape)

## Check weights shape
print(trial_net.weight.shape)

## Check bias shape
print(trial_net.bias.shape)
torch.Size([1, 4, 5, 5])
torch.Size([4, 3, 3, 3])
torch.Size([4])

This example applied a set of 3x3 convolution filters using a stride length of 1 to our 1x3x7x7 input tensor. A few things to note:

  • in_channels must match the number of channels present in the input (generally this is the second dimension of the input tensor).
  • out_channels determines the number of feature maps (output channels) to be produced by the layer. Specifying more output channels will increase the number of hidden features learned in this layer of the network.
  • kernel_size determines the size of the filter, with kernel_size=3 indicating a 3x3 filter size. Note that you could provide a non-square filter by supplying a tuple, such as (2,3).
  • stride determines how many pixels the filter shifts between applications, with stride=1 moving the filter one pixel at a time.

Summarizing this operation, the 1x3x7x7 input tensor was convolved into a 1x4x5x5 output tensor. Note that we did not use any padding, so each 7x7 slice shrank to 5x5: a 3x3 filter moving with a stride of 1 fits into $(7-3)/1 + 1 = 5$ positions along each dimension.

Because the input had 3 channels and we requested 4 output channels, our model must estimate weights for 12 different 3x3 filters, and 4 biases (1 per output channel). To better understand the role of these weights and biases, consider the following:

  • Our first set of three filters, i.e., the weights stored at index [0] of trial_net.weight, act separately on the three input channels; their results are summed, together with the bias at index [0], to produce the first output channel.
  • The second set of three filters, i.e., the weights at index [1], act separately on the input channels and combine with the bias at index [1] to produce the second output channel.
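
As a sanity check, we can reproduce the first output channel by hand using only the first set of filters and the first bias. The sketch below uses torch.nn.functional.conv2d, which applies a given weight and bias tensor directly:

In [ ]:
## Reproduce the first output channel using only the first filter set and bias
import torch.nn.functional as F
manual_first = F.conv2d(random_tensor, trial_net.weight[0:1], trial_net.bias[0:1])
print(torch.allclose(manual_first, trial_output[:, 0:1]))  ## True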

The mechanics of this layer are displayed visually in the .gif below:

In [3]:
## An easy way to display a gif in the HTML generated from a Python notebook
from IPython.display import HTML
HTML('<img src="https://miro.medium.com/v2/resize:fit:1400/1*ubRrYAZJUlCcqg7WoKjLgQ.gif">')
Out[3]:
[animated gif illustrating the convolution operation]

Printed below is the second set of filter weights (those at index [1]):

In [4]:
trial_net.weight[1,:,:]
Out[4]:
tensor([[[ 0.0967,  0.0033,  0.1359],
         [-0.0457, -0.1048, -0.0194],
         [-0.1064,  0.1163,  0.1190]],

        [[-0.1144,  0.1168, -0.1006],
         [-0.0906,  0.1913, -0.0713],
         [ 0.0328,  0.0790,  0.0957]],

        [[-0.1570,  0.0912, -0.1159],
         [ 0.1386, -0.0825,  0.0475],
         [-0.0678, -0.0566, -0.0273]]], grad_fn=<SliceBackward0>)

Question #1¶

Suppose a training example from the Fashion MNIST data (introduced in the previous lab) is given as the input to a convolutional layer created using Conv2d involving convolution kernels of size 4x4 and stride of 2.

  • Part A - If the number of output channels is specified as 5, how many parameters (weights and biases) are used in this layer? Briefly explain.
  • Part B - What are the dimensions of each feature map produced by this layer? Briefly explain.

Part 2 - Pooling Layers¶

Convolutional layers are used to learn spatially dependent feature patterns in an image. For example, the first convolutional layer in a deep network might detect edges, curves, and color gradients. However, it is easy for convolutional layers to produce output that is substantially larger than is desirable. For example, if the input is padded and 10 convolution kernels are used to learn features from an image with a single input channel, the output tensor is now 10 times larger than the input.

Consequently, most convolutional networks use a pooling layer immediately after convolution to reduce the dimension of inputs into subsequent layers. As a demonstration, consider a randomly generated tensor of dimension [1,1,4,4]:

In [5]:
random_tensor = torch.rand(1,1,4,4)
print(random_tensor)
tensor([[[[0.8892, 0.0091, 0.6755, 0.4736],
          [0.6761, 0.7187, 0.3776, 0.3354],
          [0.6368, 0.5166, 0.9557, 0.8515],
          [0.7688, 0.9752, 0.5153, 0.7582]]]])

Sliding a 2x2 pooling filter across the 4x4 slice of this tensor using a stride of 2 creates 4 distinct regions, and pooling using MaxPool2d will keep only the maximum value within each region:

In [6]:
trial_pool = nn.MaxPool2d(kernel_size = 2, stride = 2)
pool_output = trial_pool(random_tensor)
print(pool_output)
tensor([[[[0.8892, 0.6755],
          [0.9752, 0.9557]]]])

Similarly, we could perform average pooling:

In [7]:
avg_pool = nn.AvgPool2d(kernel_size = 2, stride = 2)
pool_output = avg_pool(random_tensor)
print(pool_output)
tensor([[[[0.5733, 0.4655],
          [0.7244, 0.7702]]]])

Note that a stride of 2 can be problematic for an input slice with an odd number of rows and/or columns. The default behavior in these situations is controlled by the argument ceil_mode. When set to False, the pooling filter cannot go "out of bounds", so certain portions of the input won't be used. When set to True, the filter can go out of bounds so long as its top-left corner starts within the input (or its left padding).

Consider the example below:

In [8]:
## Randomly generated 1x1x5x5 tensor
random_tensor = torch.rand(1,1,5,5)

## Two different pooling operations
ceil_false = nn.MaxPool2d(kernel_size = 2, stride = 2, ceil_mode = False)
ceil_true = nn.MaxPool2d(kernel_size = 2, stride = 2, ceil_mode = True)

## Note the difference in output shape
print(ceil_false(random_tensor).shape)
print(ceil_true(random_tensor).shape)
torch.Size([1, 1, 2, 2])
torch.Size([1, 1, 3, 3])
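
In general (with no padding), a pooling window of size $k$ applied with stride $s$ to an input of width $W$ yields an output of width $\lfloor (W-k)/s \rfloor + 1$ when ceil_mode=False and $\lceil (W-k)/s \rceil + 1$ when ceil_mode=True. For the 5x5 input above, $\lfloor (5-2)/2 \rfloor + 1 = 2$ while $\lceil (5-2)/2 \rceil + 1 = 3$, matching the printed shapes.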

Question #2¶

  • Part A - Using the example tensor, trial_output, produced in Part 1, apply ReLU activation followed by max pooling and note the output. Then, swap the order of these operations (i.e., apply max pooling followed by ReLU activation). What impact does the order have on the output?
  • Part B - Repeat the comparison from Part A using average pooling (instead of max pooling). How do these results compare with what you observed in Part A?

Part 3 - Padding¶

At any step of a convolutional neural network we may apply padding to the input to help ensure that features present in the edges of the input are properly handled. While not an essential step, padding is usually applied to the inputs of a network's first convolutional layer, and sometimes to the inputs of subsequent layers.

For illustrative purposes, let's apply padding to the input tensor used in the pooling examples from the previous section:

In [10]:
## Randomly generated 1x1x5x5 tensor
random_tensor = torch.rand(1,1,5,5)

## Add padding
padding_step = nn.ZeroPad2d(padding=1)
padded_input = padding_step(random_tensor)
print(padded_input)

## See the impact
print(ceil_false(padded_input))
print(ceil_false(random_tensor))
tensor([[[[0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
          [0.0000, 0.3443, 0.2315, 0.0039, 0.4375, 0.4186, 0.0000],
          [0.0000, 0.0356, 0.5737, 0.1951, 0.0751, 0.9896, 0.0000],
          [0.0000, 0.4622, 0.6268, 0.4209, 0.1618, 0.8350, 0.0000],
          [0.0000, 0.0370, 0.7792, 0.1690, 0.7236, 0.1897, 0.0000],
          [0.0000, 0.1471, 0.4918, 0.5798, 0.9537, 0.3755, 0.0000],
          [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000]]]])
tensor([[[[0.3443, 0.2315, 0.4375],
          [0.4622, 0.6268, 0.9896],
          [0.1471, 0.7792, 0.9537]]]])
tensor([[[[0.5737, 0.4375],
          [0.7792, 0.7236]]]])

Notice how padding allows our 2x2 pooling operation to consider the values stored in every element of the input tensor in this example. The tradeoff is that the output feature map is now slightly larger.
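
Also note that padding doesn't require a separate layer: Conv2d and MaxPool2d both accept a padding argument. As a minimal sketch (reusing the layer dimensions from Part 1), a 3x3 convolution with padding=1 preserves the spatial size of its input:

In [ ]:
## With padding=1, a 3x3 kernel and a stride of 1 preserve the 7x7 spatial dimensions
padded_conv = nn.Conv2d(in_channels=3, out_channels=4, kernel_size=3, stride=1, padding=1)
print(padded_conv(torch.rand(1,3,7,7)).shape)  ## torch.Size([1, 4, 7, 7])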

Part 4 - Example (Fashion MNIST)¶

At this point we've covered the basics of how convolution, pooling, and padding operations are implemented in PyTorch. We're now ready to build a relatively simple convolutional neural network to use on the Fashion MNIST data (introduced in our previous lab).

Recall that this dataset contained 1000 examples (900 in the training set) of 28x28 pixel grayscale images of 10 different fashion objects.

We'll start by defining the network architecture:

In [11]:
from torch import nn

class my_net(nn.Module):
    
    ## Constructor commands
    def __init__(self):
        super(my_net, self).__init__()
        
        ## Define architecture
        self.conv_stack = nn.Sequential(
            nn.Conv2d(1,10,4,1),
            nn.ReLU(),
            nn.MaxPool2d(2,2),
            nn.Conv2d(10,30,2,1),
            nn.ReLU(),
            nn.MaxPool2d(2,2),
            nn.Flatten(),
            nn.Linear(750, 250),
            nn.ReLU(),
            nn.Linear(250, 10)
        )
    
    ## Function to generate predictions
    def forward(self, x):
        scores = self.conv_stack(x)
        return scores
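
Before moving on, it can be reassuring to verify that the forward pass works on input of the intended shape. The sketch below sends a single dummy 28x28 grayscale image through the network (working out the intermediate dimensions is left for Question #3):

In [ ]:
## Pass a dummy 1x1x28x28 tensor through the network
net_check = my_net()
print(net_check(torch.rand(1,1,28,28)).shape)  ## torch.Size([1, 10]), one score per class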

Question #3¶

  • Part A - For a single image from the Fashion MNIST dataset, what are the dimensions of the output tensor produced by nn.Conv2d(1,10,4,1) in the first convolution operation of the network? What are the dimensions after nn.ReLU() and nn.MaxPool2d(2,2) have been applied to this output?
  • Part B - Notice that a variety of image sizes (pixel dimensions) are acceptable inputs to nn.Conv2d(1,10,4,1) so long as they contain a single color channel. Does this mean that this network architecture can handle input images of any size? Briefly explain.
  • Part C - Where does the input value of 750 in nn.Linear(750, 250) come from? Can the network still be used on the Fashion MNIST data (in its original format) if this value is changed?
  • Part D - Can the value of 250 in nn.Linear(750, 250) be changed without requiring changes to the format of the input data? Briefly explain.

Next, we'll set up a few of the parameters required to train our network:

In [14]:
## Hyperparameters
epochs = 300
lrate = 0.025
bsize = 100

## For reproducibility
torch.manual_seed(7)

## Cost Function
cost_fn = nn.CrossEntropyLoss()

## Initialize the model
net = my_net()

## Optimizer (Stochastic Gradient Descent)
optimizer = torch.optim.SGD(net.parameters(), lr=lrate)

Now we'll prepare the Fashion MNIST data used to train the network. This code should be familiar from our previous lab.

In [15]:
### Read flattened, processed data
import pandas as pd
fash_mnist = pd.read_csv("https://remiller1450.github.io/data/fashion_mnist_train.csv")

## Train-test split
from sklearn.model_selection import train_test_split
train_fash, test_fash = train_test_split(fash_mnist, test_size=0.1, random_state=5)

### Separate the label column (outcome)
train_y = train_fash['y']
train_X = train_fash.drop(['y'], axis=1)
test_y = test_fash['y']
test_X = test_fash.drop(['y'], axis=1)

### Convert to numpy array then reshape to 900 by 28 by 28
mnist_unflattened = train_X.to_numpy()
mnist_unflattened = mnist_unflattened.reshape(900,28,28)

## Convert to tensor
mnist_tensor = torch.from_numpy(mnist_unflattened)
train_X = torch.reshape(mnist_tensor, [900,1,28,28])

## Make DataLoader
from torch.utils.data import DataLoader, TensorDataset
y_tensor = torch.Tensor(train_y.to_numpy())
train_loader = DataLoader(TensorDataset(train_X.type(torch.FloatTensor), 
                        y_tensor.type(torch.LongTensor)), batch_size=bsize)
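
As a quick sanity check (a minimal sketch), we can draw a single batch from the loader and confirm its dimensions match our expectations:

In [ ]:
## Inspect the first batch of images and labels
xb, yb = next(iter(train_loader))
print(xb.shape, yb.shape)  ## torch.Size([100, 1, 28, 28]) torch.Size([100])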

We've now set up everything we'll need to train the network. We'll do so using the same training loop that appeared in our previous lab:

In [16]:
## Initial values for cost tracking
track_cost = np.zeros(epochs)
cur_cost = 0.0

## Loop through the data
for epoch in range(epochs):
    
    cur_cost = 0.0
    correct = 0.0
    
    ## train_loader is iterable; enumerate provides the batch index
    for i, data in enumerate(train_loader, 0):
        
        ## The input tensor and labels tensor for the current batch
        inputs, labels = data
        
        ## Clear the gradient from the previous batch
        optimizer.zero_grad()
        
        ## Provide the input tensor into the network to get outputs
        outputs = net(inputs)
        
        ## Calculate the cost for the current batch
        ## Note: nn.CrossEntropyLoss expects raw scores (logits) and applies softmax
        ## internally; nn.Softmax is applied here to match the loop from our previous lab
        cost = cost_fn(nn.Softmax(dim=1)(outputs), labels)
        
        ## Calculate the gradient
        cost.backward()
        
        ## Update the model parameters using the gradient
        optimizer.step()
        
        ## Track the current cost (accumulating across batches)
        cur_cost += cost.item()
    
    ## Store the accumulated cost at each epoch
    track_cost[epoch] = cur_cost
    # print(f"Epoch: {epoch} Cost: {cur_cost}") ## Uncomment this if you want printed updates

We can plot the cost by training epoch to verify that the model has converged:

In [17]:
import matplotlib.pyplot as plt
plt.plot(np.linspace(0, epochs, epochs), track_cost)
plt.show()

Since these steps are no longer new, let's jump straight into seeing how this network performs on the test data:

In [18]:
## Make test outcomes into a tensor
test_y_tensor = torch.Tensor(test_y.to_numpy())

### Convert to numpy array then reshape
test_unflattened = test_X.to_numpy().reshape(len(test_y),1,28,28)

## Convert test images into a tensor
test_tensor = torch.from_numpy(test_unflattened)

## Combine X and y tensors into a TensorDataset and DataLoader
test_loader = DataLoader(TensorDataset(test_tensor.type(torch.FloatTensor), 
                                       test_y_tensor.type(torch.LongTensor)), batch_size=bsize)

## Repeat the evaluation loop using the test data
correct = 0
total = 0
with torch.no_grad():
    for data in test_loader:
        images, labels = data
        outputs = net(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
print(correct/total)
0.78

Our previous neural network model (which did not use convolutional layers) had a test set accuracy of around 75%, so our convolutional neural network achieves a modestly higher classification accuracy (under ideal circumstances). However, this model includes many more parameters, which makes it much more difficult to train. Additionally, you should be aware that neural networks are overparameterized models (in statistical terms), so they will not learn the same weights if you repeatedly train them on the same training data with different random initializations of the weights and biases. Nevertheless, with a little trial and error it's possible to arrive at a network that achieves a cost $\leq 14$ (as accumulated in our training loop) and a test set accuracy of around 80%.
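
To appreciate just how many parameters this network involves, we can count them directly (a minimal sketch):

In [ ]:
## Total number of trainable weights and biases in the network
print(sum(p.numel() for p in net.parameters()))  ## 191660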

Part 5 - Data Augmentation using Transformations¶

Convolutional neural networks are robust to the precise positions of hidden features within an image, so a common strategy used during network training is data augmentation, or the random alteration of training images in ways that preserve their meaning in order to provide the network with a larger and more diverse set of training examples.

For example, we might augment the Fashion MNIST data by randomly flipping each image horizontally (since a shoe is still a shoe regardless of whether the toe is pointed to the left or to the right). We might also think that adding a little "fuzz" or blurring to an image provides additional variety without fundamentally altering what each image means.

Below we define a set of data augmentation transformations that we can later use in our training loop:

In [19]:
## Compose Transformations
from torchvision import transforms
data_transforms = transforms.Compose([
        transforms.GaussianBlur(kernel_size=(5,5), sigma=(0.1, 5)),
        transforms.RandomHorizontalFlip()
])

Note that the kernel_size argument defines the dimensions of the Gaussian kernel, and the two values supplied to the sigma argument give the minimum and maximum of the range from which the standard deviation of the Gaussian kernel is randomly sampled each time the transformation is applied. This link provides a more detailed (and relatively non-technical) explanation of Gaussian blurring.
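
To get a feel for what these transformations do, the sketch below displays one training image next to a randomly augmented copy (this assumes train_X is the image tensor created in Part 4):

In [ ]:
## Compare an original training image with an augmented copy
example = train_X[0].type(torch.FloatTensor)   ## shape [1, 28, 28]
augmented = data_transforms(example)

fig, axes = plt.subplots(1, 2)
axes[0].imshow(example[0], cmap='gray')
axes[0].set_title('Original')
axes[1].imshow(augmented[0], cmap='gray')
axes[1].set_title('Augmented')
plt.show()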

Now let's utilize these data augmentation transformations on each batch of images during our training loop:

In [20]:
## Re-run the training loop, notice the new data_transforms() command
track_cost = np.zeros(epochs)
cur_cost = 0.0

for epoch in range(epochs):
    cur_cost = 0.0
    correct = 0.0
    
    for i, data in enumerate(train_loader, 0):
        inputs, labels = data
        
        ## Transform the input data using our data augmentation strategies
        inputs = data_transforms(inputs)
        
        ## Same as before
        optimizer.zero_grad()
        outputs = net(inputs)
        cost = cost_fn(nn.Softmax(dim=1)(outputs), labels)
        cost.backward()
        optimizer.step()
        cur_cost += cost.item()
    
    ## Store the accumulated cost at each epoch
    track_cost[epoch] = cur_cost
    # print(f"Epoch: {epoch} Cost: {cur_cost}") ## Uncomment this if you want printed updates
    
plt.plot(np.linspace(0, epochs, epochs), track_cost)
plt.show()

Based on the results shown in this graph, the extra variety provided by these augmented training examples appears to help the model learn more consistently.
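
If you'd like to see whether augmentation also changed test set performance, the evaluation loop from Part 4 can be re-used as-is (a minimal sketch; your accuracy will vary with the random initialization and augmentations):

In [ ]:
## Re-evaluate the (re-trained) network on the test data
correct, total = 0, 0
with torch.no_grad():
    for images, labels in test_loader:
        _, predicted = torch.max(net(images).data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
print(correct/total)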

For additional information and examples of various other types of data augmentation methods, see this page.

Question #4 (Cats vs. Dogs revisited)¶

For this question you will revisit the cats vs. dogs image data stored in the zipped folder at this link. Recall that this folder includes 50 images of cats and 100 images of dogs (chihuahua breed). In our previous work with these data, it was immensely challenging to get a neural network to learn anything meaningful. This time, using the new methods introduced in this lab, we'll aim to build a neural network that at least learns something from the images.

  • Part A - Similar to work from our previous lab, create objects to store these images and class labels and perform a 75-25 train-test split using random_state=5. Next, reorganize the dimensions of the image tensor to follow the conventional format of (N images, C color channels, w pixels, h pixels).
  • Part B - Create a composition of data transformations that apply Gaussian blur, random horizontal flipping, and random rotation (between 0 and 180 degrees). You may consult the link at the end of the previous section for information on how to implement random rotation.
  • Part C - Define a network architecture containing the following layers (in the order provided below). You should pay careful attention to inputs of each layer to ensure they are appropriate for the tensors we're using to store our dog/cat images.
    • A convolutional layer of 3x3 kernels with a stride of 1 and 8 output channels
    • ReLU
    • Max pooling with 2x2 kernels
    • A convolutional layer of 2x2 kernels with a stride of 1 and 16 output channels
    • ReLU
    • Max pooling with 2x2 kernels
    • Flattening
    • A fully connected linear layer with 200 outputs
    • ReLU
    • A linear layer that generates 2 outputs (corresponding to the class labels).
  • Part D - Train the network using stochastic gradient descent on batches of 28 images that are augmented using the transformations you defined in Part B. For your reference, using a learning rate of 0.001 and training for 300 epochs with weights initialized under torch.manual_seed(3), I was able to achieve 73.2% classification accuracy on the training data (better than the 66% you'd get by always predicting the majority class), as well as 81.5% classification accuracy on the test data.
  • Part E - Once you've found a network in Part D that learns something from the training data, evaluate its performance (classification accuracy) on the test data.