This lab covers the architecture, training, and evaluation of convolutional neural networks (CNNs) using PyTorch. We'll need the following libraries:
import torch
import torchvision
import numpy as np
Our previous lab introduced the basic framework of model building and training in PyTorch. Convolutional neural networks use the same fundamental steps, but with a new type of building block, the convolutional layer, which we'll implement using Conv2d().
The example below demonstrates the four essential arguments of Conv2d() on a randomly generated tensor whose dimensions might represent a single 7x7 image with 3 color channels:
## Create random tensor to represent a 7x7 image with 3 channels
random_tensor = torch.rand(1,3,7,7)
## Use random_tensor as input into Conv2d
from torch import nn
trial_net = nn.Conv2d(in_channels=3, out_channels=4, kernel_size=3, stride=1)
trial_output = trial_net(random_tensor)
## Check output shape
print(trial_output.shape)
torch.Size([1, 4, 5, 5])
This example applied a set of 3x3 convolution filters using a stride length of 1 to our 1x3x7x7 input tensor. A few things to note:

- in_channels must match the number of channels present in the input, which will be the second dimension of the input tensor if your data are appropriately formatted.
- out_channels determines the number of feature maps (output channels) produced by the layer. Specifying more output channels will increase the number of hidden features learned in this layer of the network.
- kernel_size determines the size of the filter, with kernel_size=3 indicating a 3x3 filter size. You could use a non-square kernel by supplying a tuple, such as (2,3), to this argument.

Here we can see that the 1x3x7x7 input tensor was convolved into a 1x4x5x5 output tensor (note that we did not use any padding).
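This output size follows the standard convolution arithmetic: with no padding, each spatial dimension of the output equals floor((input size - kernel size) / stride) + 1. As a quick check of this formula against the example above:
## floor((7 - 3) / 1) + 1 = 5, matching the 5x5 output above
print((7 - 3) // 1 + 1)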
Because our input tensor contains 3 channels and we requested 4 output channels, our network must estimate matrices of weights for 12 different 3x3 filters, as well as 4 biases (1 per output channel). Below we verify this by printing the shapes of the weights and bias tensors:
## Check weights shape
print(trial_net.weight.shape)
## Check bias shape
print(trial_net.bias.shape)
torch.Size([4, 3, 3, 3])
torch.Size([4])
To better understand the role of these weights and biases, consider the following:

- The first group of 3 weight matrices, trial_net.weight[0,:,:], act separately on the input channels to contribute, together with the bias trial_net.bias[0], to the first output channel.
- The second group, trial_net.weight[1,:,:], act separately on the input channels to contribute, together with the bias trial_net.bias[1], to the second output channel.

This operation is shown visually in the .gif below:
## Sorry, it's hard to embed gifs into Markdown chunks in a Python Notebook
from IPython.display import HTML
HTML('<img src="https://miro.medium.com/v2/resize:fit:1400/1*ubRrYAZJUlCcqg7WoKjLgQ.gif">')
If you're curious, printed below is the group of weight matrices (index 1) that contributes to the second output channel:
trial_net.weight[1,:,:]
tensor([[[ 0.1786, -0.0736,  0.1632],
         [-0.1543,  0.0344, -0.0067],
         [-0.0531, -0.0487,  0.1482]],

        [[ 0.0546,  0.1791, -0.0844],
         [-0.1099,  0.1227,  0.0527],
         [ 0.1037,  0.1866,  0.1703]],

        [[-0.0082,  0.1250, -0.0716],
         [-0.1125, -0.1776,  0.1115],
         [-0.0641, -0.0270,  0.0127]]], grad_fn=<SliceBackward0>)
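As a small sanity check of our own (not part of the original example), we can reproduce a single entry of trial_output by hand. The top-left value of the first output channel is the sum, across input channels, of the elementwise products between weight group 0 and the corresponding 3x3 patch of the input, plus the first bias:
## Manually reproduce trial_output[0, 0, 0, 0]
patch = random_tensor[0, :, 0:3, 0:3]  ## top-left 3x3 patch from each of the 3 input channels
manual = (patch * trial_net.weight[0]).sum() + trial_net.bias[0]
print(manual)  ## should match trial_output[0, 0, 0, 0]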
Question #1: For this question, consider the Fashion MNIST training data introduced in the previous lab and a convolutional layer created using Conv2d() with 4x4 kernels and a stride of 2.
Convolutional layers excel at learning spatially dependent patterns. For example, the first convolutional layer in a deep network might detect edges, curves, and color gradients. However, convolutional layers can easily produce output that is substantially larger than is desirable. For example, if the input tensor is padded and 10 convolution kernels are used to learn features from an image with a single input channel, the output tensor is now 10 times larger than the input.
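To make this growth concrete, the short example below (our own illustration, using a hypothetical 28x28 grayscale input) pads the input and applies 10 kernels, producing an output tensor 10 times larger than the input:
## A padded convolution with 10 kernels yields output 10x larger than the single-channel input
demo_conv = nn.Conv2d(in_channels=1, out_channels=10, kernel_size=3, stride=1, padding=1)
print(demo_conv(torch.rand(1, 1, 28, 28)).shape)  ## torch.Size([1, 10, 28, 28])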
Consequently, most convolutional networks use a pooling layer immediately after convolution to reduce the dimension of inputs into subsequent layers. As a demonstration, consider a randomly generated tensor of dimension [1,1,4,4]:
random_tensor = torch.rand(1,1,4,4)
print(random_tensor)
tensor([[[[0.4082, 0.5160, 0.9411, 0.7076],
          [0.3695, 0.8186, 0.9490, 0.3259],
          [0.5255, 0.9043, 0.4681, 0.2005],
          [0.6820, 0.0663, 0.3570, 0.7139]]]])
Sliding a 2x2 pooling filter across the 4x4 slice of this tensor using a stride of 2 creates 4 distinct regions, and pooling via MaxPool2d()
will keep only the maximum value in each region:
trial_pool = nn.MaxPool2d(kernel_size = 2, stride = 2)
pool_output = trial_pool(random_tensor)
print(pool_output)
tensor([[[[0.8186, 0.9490],
          [0.9043, 0.7139]]]])
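To confirm what the pooling filter is doing, we can check the top-left pooled value by hand; it should equal the maximum of the top-left 2x2 region of the input:
## Max over the top-left 2x2 region of random_tensor
print(random_tensor[0, 0, 0:2, 0:2].max())  ## tensor(0.8186)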
Similarly, we could perform average pooling, which will calculate and keep the average value in each region:
avg_pool = nn.AvgPool2d(kernel_size = 2, stride = 2)
pool_output = avg_pool(random_tensor)
print(pool_output)
tensor([[[[0.5281, 0.7309],
          [0.5445, 0.4349]]]])
Whenever using a pooling layer, you should be aware of the impacts of using a stride $>1$ on an input slice with an odd number of rows and/or columns. The default pooling behavior in these situations is controlled by the argument ceil_mode.

- With ceil_mode = False, the pooling filter cannot go "out of bounds", so certain portions of the input tensor are not used at all.
- With ceil_mode = True, the filter can go out of bounds so long as its top-left corner starts within the input (or padding, if any is being used).

Consider the example below:
## Randomly generated 1x5x5 tensor
random_tensor = torch.rand(1,1,5,5)
## Two different pooling operations
ceil_false = nn.MaxPool2d(kernel_size = 2, stride = 2, ceil_mode = False)
ceil_true = nn.MaxPool2d(kernel_size = 2, stride = 2, ceil_mode = True)
## Note the difference in output shape
print(ceil_false(random_tensor).shape)
print(ceil_true(random_tensor).shape)
torch.Size([1, 1, 2, 2])
torch.Size([1, 1, 3, 3])
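These shapes follow from the pooling size formula, which uses floor((input size - kernel size) / stride) + 1 by default and replaces the floor with a ceiling when ceil_mode = True:
import math
print(math.floor((5 - 2) / 2) + 1)  ## 2 (ceil_mode = False)
print(math.ceil((5 - 2) / 2) + 1)   ## 3 (ceil_mode = True)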
Question #2: Using trial_output (given again below), apply ReLU activation followed by max pooling and note the output. Then, swap the order of these operations (i.e., apply max pooling followed by ReLU activation). What impact does the order have on the output?
## Trial_net for Question #2
trial_net = nn.Conv2d(in_channels=3, out_channels=4, kernel_size=3, stride=1)
At any step of a convolutional neural network we might consider padding the input to ensure that features present at the edges of the input are properly handled. While not an essential step, padding is usually applied to the inputs used in a network's first convolutional layer, and sometimes to the inputs of subsequent layers.
For illustrative purposes, let's apply padding to the input tensor used in the pooling examples from the previous section:
## Randomly generated 1x5x5 tensor
random_tensor = torch.rand(1,1,5,5)
## Add padding
padding_step = nn.ZeroPad2d(padding=1)
padded_input = padding_step(random_tensor)
print(padded_input)
## See the impact
print(ceil_false(padded_input))
print(ceil_false(random_tensor))
tensor([[[[0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000],
          [0.0000, 0.8166, 0.6145, 0.7464, 0.4755, 0.0061, 0.0000],
          [0.0000, 0.0585, 0.0078, 0.4892, 0.9638, 0.5208, 0.0000],
          [0.0000, 0.9876, 0.1788, 0.5228, 0.1252, 0.1227, 0.0000],
          [0.0000, 0.3907, 0.1972, 0.1292, 0.3325, 0.4888, 0.0000],
          [0.0000, 0.5706, 0.8735, 0.6341, 0.6893, 0.1471, 0.0000],
          [0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000, 0.0000]]]])
tensor([[[[0.8166, 0.7464, 0.4755],
          [0.9876, 0.5228, 0.9638],
          [0.5706, 0.8735, 0.6893]]]])
tensor([[[[0.8166, 0.9638],
          [0.9876, 0.5228]]]])
You should be aware of the trade-offs involved in padding. On one hand, the 2x2 pooling operation is now able to consider the values stored in every element of the input tensor in this example. On the other hand, the resulting feature map is larger than it otherwise would have been.
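Because this shape arithmetic comes up repeatedly, it can be handy to collect it into a small helper function. The function below is a convenience sketch of our own (not part of PyTorch) that computes the output size of one spatial dimension for a convolution or pooling layer using the default floor behavior:
import math

def out_size(n, kernel, stride=1, padding=0):
    ## Output size of one spatial dimension (floor mode)
    return math.floor((n + 2*padding - kernel) / stride) + 1

## Example: the padded 5x5 input pooled with a 2x2 filter and stride 2 -> 3x3
print(out_size(5, kernel=2, stride=2, padding=1))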
At this point we've covered the basics of how convolution, pooling, and padding operations are implemented in PyTorch. We're now ready to build a relatively simple convolutional neural network to use on the Fashion MNIST data (introduced in our previous lab).
Recall that this dataset contains 1000 examples (900 in the training set) of 28x28 pixel grayscale images of 10 different fashion objects.
We'll start by defining a network architecture:
from torch import nn
class my_net(nn.Module):

    ## Constructor commands
    def __init__(self):
        super(my_net, self).__init__()

        ## Define architecture
        self.conv_stack = nn.Sequential(
            nn.Conv2d(1, 10, 4, 1),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Conv2d(10, 30, 2, 1),
            nn.ReLU(),
            nn.MaxPool2d(2, 2),
            nn.Flatten(),
            nn.Linear(750, 250),
            nn.ReLU(),
            nn.Linear(250, 10)
        )

    ## Function to generate predictions
    def forward(self, x):
        scores = self.conv_stack(x)
        return scores
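Before training, it can be helpful to verify the architecture by pushing a dummy tensor shaped like a single Fashion MNIST image through the network (a quick check of our own, not a required step):
## Sanity check: one fake 28x28 grayscale image -> 10 class scores
dummy = torch.rand(1, 1, 28, 28)
print(my_net()(dummy).shape)  ## torch.Size([1, 10])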
When compared to the architecture given in our previous lab, you should notice that this model does not begin by flattening the images, and that the sequence of functions applied in nn.Sequential() is much longer.
Question #3: Use the network architecture given above when answering the following questions. I encourage you to build your own small examples for testing purposes.

- Part A: What are the dimensions of the data after nn.Conv2d(1,10,4,1) in the first convolution operation of the network?
- Part B: What are the dimensions of the data after nn.ReLU() and nn.MaxPool2d(2,2) have been applied to the output from Part A?
- Part C: Images of any size can be given to nn.Conv2d(1,10,4,1) so long as they contain a single color channel. Does this mean that this network architecture can handle input images of any size? Briefly explain.
- Part D: Where does the value 750 used in nn.Linear(750, 250) come from? Can the network still be used on the Fashion MNIST data (in its original format) if this value is changed while every other step remains the same?
- Part E: Can the value 250 used in nn.Linear(750, 250) be changed without requiring changes to the format of the input data? What else would have to change if this value is modified?

The steps that follow are largely the same as those seen in our previous lab.
We'll begin by setting up a few of the parameters required to train our network:
## Hyperparameters
epochs = 300
lrate = 0.025
bsize = 100
## For reproduction purposes
torch.manual_seed(7)
## Cost Function
cost_fn = nn.CrossEntropyLoss()
## Initialize the model
net = my_net()
## Optimizer (Stochastic Gradient Descent)
optimizer = torch.optim.SGD(net.parameters(), lr=lrate)
Now we'll prepare the MNIST data to be used with this network:
### Read flattened, processed data
import pandas as pd
fash_mnist = pd.read_csv("https://remiller1450.github.io/data/fashion_mnist_train.csv")
## Train-test split
from sklearn.model_selection import train_test_split
train_fash, test_fash = train_test_split(fash_mnist, test_size=0.1, random_state=5)
### Separate the label column (outcome)
train_y = train_fash['y']
train_X = train_fash.drop(['y'], axis=1)
test_y = test_fash['y']
test_X = test_fash.drop(['y'], axis=1)
### Convert to numpy array then reshape to 900 by 28 by 28
mnist_unflattened = train_X.to_numpy()
mnist_unflattened = mnist_unflattened.reshape(900,28,28)
## Convert to tensor
mnist_tensor = torch.from_numpy(mnist_unflattened)
train_X = torch.reshape(mnist_tensor, [900,1,28,28])
## Make DataLoader
from torch.utils.data import DataLoader, TensorDataset
y_tensor = torch.Tensor(train_y.to_numpy())
train_loader = DataLoader(TensorDataset(train_X.type(torch.FloatTensor),
y_tensor.type(torch.LongTensor)), batch_size=bsize)
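As a quick check of our own, we can pull a single batch from train_loader to confirm the shapes the network will receive:
## Peek at one batch: images should be [100, 1, 28, 28], labels [100]
images, labels = next(iter(train_loader))
print(images.shape, labels.shape)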
At this point we can re-use the same training loop from the previous lab:
## Initial values for cost tracking
track_cost = np.zeros(epochs)
cur_cost = 0.0
## Loop through the data
for epoch in range(epochs):
    cur_cost = 0.0
    correct = 0.0

    ## train_loader is iterable; i tracks the batch number
    for i, data in enumerate(train_loader, 0):

        ## The input tensor and labels tensor for the current batch
        inputs, labels = data

        ## Clear the gradient from the previous batch
        optimizer.zero_grad()

        ## Provide the input tensor into the network to get outputs
        outputs = net(inputs)

        ## Calculate the cost for the current batch
        ## Note: nn.CrossEntropyLoss applies log-softmax to raw scores internally,
        ## so the explicit nn.Softmax here is not strictly required
        cost = cost_fn(nn.Softmax(dim=1)(outputs), labels)

        ## Calculate the gradient
        cost.backward()

        ## Update the model parameters using the gradient
        optimizer.step()

        ## Track the current cost (accumulating across batches)
        cur_cost += cost.item()

    ## Store the accumulated cost at each epoch
    track_cost[epoch] = cur_cost
    # print(f"Epoch: {epoch} Cost: {cur_cost}") ## Uncomment this if you want printed updates
We can plot the cost by training epoch to verify that the model has converged:
import matplotlib.pyplot as plt
plt.plot(np.linspace(0, epochs, epochs), track_cost)
plt.show()
And since this workflow is no longer new, let's jump straight to evaluating the network's accuracy on the test data:
## Make test outcomes into a tensor
test_y_tensor = torch.Tensor(test_y.to_numpy())
### Convert to numpy array then reshape
test_unflattened = test_X.to_numpy().reshape(len(test_y),1,28,28)
## Convert test images into a tensor
test_tensor = torch.from_numpy(test_unflattened)
## Combine X and y tensors into a TensorDataset and DataLoader
test_loader = DataLoader(TensorDataset(test_tensor.type(torch.FloatTensor),
test_y_tensor.type(torch.LongTensor)), batch_size=bsize)
## Repeat the evaluation loop using the test data
correct = 0
total = 0

with torch.no_grad():
    for data in test_loader:
        images, labels = data
        outputs = net(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print(correct/total)
0.78
Our convolutional neural network is able to achieve a modestly higher classification accuracy (under ideal circumstances) than our previous neural network. However, this model includes many more parameters, which makes it much more difficult to train.
Additionally, you should be aware that neural networks are overparameterized models (in statistical terms), so they will not learn the same weights if you repeatedly train them using the same training data with different random initializations of the weights and biases. Nevertheless, with a little bit of trial and error it's possible to arrive at a network that achieves a cost $\leq 14$ (measured in terms of how it was calculated in our loop), and a test set accuracy of around 80%.
It's also worth pointing out that it is common in neural network training to need to "restart" a few times to get a favorable set of randomly generated weights that allows the model to gain traction and begin to learn patterns in the data.
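One minimal way to implement such restarts (a sketch of our own, not a prescribed recipe) is to train from several seeds for a single epoch each and keep whichever initialization achieves the lowest cost before committing to a full run:
## Try a few seeds for one epoch each and keep the most promising start
best_seed, best_cost = None, float('inf')
for seed in [1, 2, 3]:
    torch.manual_seed(seed)
    candidate = my_net()
    opt = torch.optim.SGD(candidate.parameters(), lr=lrate)
    epoch_cost = 0.0
    for inputs, labels in train_loader:
        opt.zero_grad()
        cost = cost_fn(nn.Softmax(dim=1)(candidate(inputs)), labels)
        cost.backward()
        opt.step()
        epoch_cost += cost.item()
    if epoch_cost < best_cost:
        best_seed, best_cost = seed, epoch_cost
print(best_seed, best_cost)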
Convolutional neural networks are robust to the precise positions of hidden features in an image. A common strategy used during network training is therefore data augmentation: the intentional alteration of training images in ways that preserve their meaning, providing the network with a larger and more diverse set of training examples.
For example, we could augment the Fashion MNIST data by randomly flipping each image horizontally (since a shoe is still a shoe regardless of whether the toe is pointed to the left or to the right). We might also think that adding a little "fuzz" or blurring to some of the images could provide additional variety without fundamentally altering what each image means.
Below we define a set of data augmentation transformations that we can later use in our training loop:
## Compose our set of data augmentation transformations
from torchvision import transforms
data_transforms = transforms.Compose([
transforms.GaussianBlur(kernel_size=(5,5), sigma=(0.1, 5)),
transforms.RandomHorizontalFlip()
])
Note that the kernel_size argument seen here defines the dimensions of the Gaussian kernel, and the two values supplied to the sigma argument give the minimum and maximum of the range from which the standard deviation of the Gaussian kernel is randomly sampled for each image. This link provides a more detailed (and relatively non-technical) explanation of Gaussian blurring.
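To see that these transformations are applied randomly, we can transform the same image twice and compare the results (a small check of our own):
## The same image transformed twice will usually differ due to the random blur and flips
img = train_X[0:1].type(torch.FloatTensor)
print(torch.equal(data_transforms(img), data_transforms(img)))  ## usually False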
Now let's utilize these data augmentation transformations on each batch of images during our training loop:
## Re-run the training loop, notice the new data_transforms() command
track_cost = np.zeros(epochs)
cur_cost = 0.0
for epoch in range(epochs):
    cur_cost = 0.0
    correct = 0.0

    for i, data in enumerate(train_loader, 0):
        inputs, labels = data

        ## Transform the input data using our data augmentation strategies
        inputs = data_transforms(inputs)

        ## Same as before
        optimizer.zero_grad()
        outputs = net(inputs)
        cost = cost_fn(nn.Softmax(dim=1)(outputs), labels)
        cost.backward()
        optimizer.step()
        cur_cost += cost.item()

    ## Store the accumulated cost at each epoch
    track_cost[epoch] = cur_cost
    # print(f"Epoch: {epoch} Cost: {cur_cost}") ## Uncomment this if you want printed updates
plt.plot(np.linspace(0, epochs, epochs), track_cost)
plt.show()
Based upon the results shown in this graph, we can see that the extra variety provided by these augmented training examples appears to help the model learn more consistently.
For additional information and examples of various other data augmentation methods, this page of the PyTorch documentation provides details.
Question #4: For this question you will revisit the cats vs. dogs image data stored in the zipped folder at this link. Recall that this folder includes 50 images of cats and 100 images of dogs (chihuahua breed). In our previous work with these data, it was immensely challenging to get a neural network to learn anything meaningful. This time, using the new methods introduced in this lab, we'll aim to build a neural network that at least learns something from the images.

- Split these data into training and testing sets using random_state=5. Next, reorganize the dimensions of the image tensor to follow the conventional format of (N images, C color channels, w pixels, h pixels).
- Build and train a convolutional neural network on these data. For reference, using torch.manual_seed(3) I was able to achieve 73.2% classification accuracy on the training data (better than the 66% you'd get by always predicting "dog"), as well as 81.5% classification accuracy on the test data (which might have involved some luck).