import numpy as np
import time
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
import torchvision
from torch.utils.data.sampler import SubsetRandomSampler
import torchvision.transforms as transforms
import matplotlib.pyplot as plt


from google.colab import drive
drive.mount('/content/gdrive')

Mounted at /content/gdrive


cd gdrive/MyDrive/EngSci 2T1 + PEY/Year 4/Summer/APS360/Labs/Lab_3_Gesture_Recognition

/content/gdrive/MyDrive/EngSci 2T1 + PEY/Year 4/Summer/APS360/Labs/Lab_3_Gesture_Recognition


# Data Loading and Splitting
np.random.seed(1000)
indices = list(range(400, 721))
chosen_indices = np.random.choice(indices, (2, 30), replace=False)

def train_valid_file(filename):
    val_file = any(student in filename for student in chosen_indices.astype(str)[0])
    test_file = any(student in filename for student in chosen_indices.astype(str)[1])
    train_file = not(val_file or test_file)
    return train_file

def val_valid_file(filename):
    val_file = any(student in filename for student in chosen_indices.astype(str)[0])
    test_file = any(student in filename for student in chosen_indices.astype(str)[1])
    train_file = not(val_file or test_file)
    return val_file

def test_valid_file(filename):
    val_file = any(student in filename for student in chosen_indices.astype(str)[0])
    test_file = any(student in filename for student in chosen_indices.astype(str)[1])
    train_file = not(val_file or test_file)
    return test_file

transform = transforms.Compose(
        [transforms.ToTensor(),
         transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])

train_data = torchvision.datasets.ImageFolder('./Lab_3_Gestures_W21', loader=plt.imread, is_valid_file=train_valid_file, transform=transform)
val_data = torchvision.datasets.ImageFolder('./Lab_3_Gestures_W21', loader=plt.imread, is_valid_file=val_valid_file, transform=transform)
test_data = torchvision.datasets.ImageFolder('./Lab_3_Gestures_W21', loader=plt.imread, is_valid_file=test_valid_file, transform=transform)

total_data = len(train_data) + len(val_data) + len(test_data)

print("The number of training images is", len(train_data), ", which is", len(train_data)/total_data*100, "% of the entire dataset.")
print("The number of validation images is", len(val_data), ", which is", len(val_data)/total_data*100, "% of the entire dataset.")
print("The number of test images is", len(test_data), ", which is", len(test_data)/total_data*100, "% of the entire dataset.")

The number of training images is 6160 , which is 81.09531332280147 % of the entire dataset.
The number of validation images is 682 , which is 8.978409689310162 % of the entire dataset.
The number of test images is 754 , which is 9.926276987888363 % of the entire dataset.


class CNN(nn.Module):
    def __init__(self):
        super(CNN, self).__init__()
        self.name = "cnn"
        self.conv1 = nn.Conv2d(3, 5, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(5, 10, 5)
        self.fc1 = nn.Linear(10 * 53 * 53, 32)
        self.fc2 = nn.Linear(32, 9)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 10 * 53 * 53)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        x = x.squeeze(1) # Flatten to [batch_size]
        return x


def get_model_name(name, batch_size, learning_rate, epoch):
    path = "model_{0}_bs{1}_lr{2}_epoch{3}".format(name,
                                                   batch_size,
                                                   learning_rate,
                                                   epoch)
    return path


def get_accuracy(model, batch_size, train=False):
    if train:
        data = train_data
    else:
        data = val_data
    correct = 0
    total = 0
    for imgs, labels in torch.utils.data.DataLoader(data, batch_size=batch_size):
        
        
        #############################################
        # To Enable GPU Usage
        if use_cuda and torch.cuda.is_available():
          imgs = imgs.cuda()
          labels = labels.cuda()
        #############################################

        
        output = model(imgs)
        
        # Select index with maximum prediction score
        pred = output.max(1, keepdim=True)[1]
        correct += pred.eq(labels.view_as(pred)).sum().item()
        total += imgs.shape[0]
    return correct / total


def train(model, data, batch_size=64, learning_rate=0.001, num_epochs=30):
    torch.manual_seed(1000)
    train_loader = torch.utils.data.DataLoader(data, batch_size=batch_size, shuffle=True)
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.SGD(model.parameters(), lr=learning_rate, momentum=0.9)

    iters, losses, train_acc, val_acc = [], [], [], []

    # Training
    start_time = time.time()
    n = 0 # the number of iterations
    for epoch in range(num_epochs):
        for imgs, labels in iter(train_loader):
          
          
            #############################################
            # To Enable GPU Usage
            if use_cuda and torch.cuda.is_available():
              imgs = imgs.cuda()
              labels = labels.cuda()
            #############################################
            
              
            out = model(imgs)             # forward pass
            loss = criterion(out, labels) # compute the total loss
            loss.backward()               # backward pass (compute parameter updates)
            optimizer.step()              # make the updates for each parameter
            optimizer.zero_grad()         # a clean up step for PyTorch

            # Save the current training information
            iters.append(n)
            losses.append(float(loss)/batch_size)             # compute *average* loss
            n += 1
        train_acc.append(get_accuracy(model, batch_size=batch_size, train=True)) # compute training accuracy 
        val_acc.append(get_accuracy(model, batch_size=batch_size, train=False))  # compute validation accuracy
        print(("Epoch {}: Train acc: {} |"+"Validation acc: {}").format(
                epoch + 1,
                train_acc[-1],
                val_acc[-1]))
        # Save the current model (checkpoint) to a file
        model_path = get_model_name(model.name, batch_size, learning_rate, epoch)
        torch.save(model.state_dict(), model_path)
    print('Finished Training')
    end_time = time.time()
    elapsed_time = end_time - start_time
    print("Total time elapsed: {:.2f} seconds".format(elapsed_time))

    # Plotting
    plt.title("Training Curve")
    plt.plot(iters, losses, label="Train")
    plt.xlabel("Iterations")
    plt.ylabel("Loss")
    plt.show()

    plt.title("Training Curve")
    plt.plot(range(1 ,num_epochs+1), train_acc, label="Train")
    plt.plot(range(1 ,num_epochs+1), val_acc, label="Validation")
    plt.xlabel("Epochs")
    plt.ylabel("Training Accuracy")
    plt.legend(loc='best')
    plt.show()

    print("Final Training Accuracy: {}".format(train_acc[-1]))
    print("Final Validation Accuracy: {}".format(val_acc[-1]))


small_data = torchvision.datasets.ImageFolder('./chen_1003912992/Cleaned', loader=plt.imread, transform=transform)


def get_accuracy_small(model, batch_size):
    data = small_data
    correct = 0
    total = 0
    for imgs, labels in torch.utils.data.DataLoader(data, batch_size=batch_size):
        
        
        #############################################
        # To Enable GPU Usage
        if use_cuda and torch.cuda.is_available():
          imgs = imgs.cuda()
          labels = labels.cuda()
        #############################################

        
        output = model(imgs)
        
        # Select index with maximum prediction score
        pred = output.max(1, keepdim=True)[1]
        correct += pred.eq(labels.view_as(pred)).sum().item()
        total += imgs.shape[0]
    return correct / total


def train_small(model, data, batch_size=27, learning_rate=0.001, num_epochs=200):
    torch.manual_seed(1000)
    train_loader = torch.utils.data.DataLoader(data, batch_size=batch_size, shuffle=True)
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.SGD(model.parameters(), lr=learning_rate, momentum=0.9)

    iters, losses, train_acc = [], [], []

    # Training
    start_time = time.time()
    n = 0 # the number of iterations
    for epoch in range(num_epochs):
        for imgs, labels in iter(train_loader):
          
          
            #############################################
            # To Enable GPU Usage
            if use_cuda and torch.cuda.is_available():
              imgs = imgs.cuda()
              labels = labels.cuda()
            #############################################
            
              
            out = model(imgs)             # forward pass
            loss = criterion(out, labels) # compute the total loss
            loss.backward()               # backward pass (compute parameter updates)
            optimizer.step()              # make the updates for each parameter
            optimizer.zero_grad()         # a clean up step for PyTorch

            # Save the current training information
            iters.append(n)
            losses.append(float(loss)/batch_size)             # compute *average* loss
            train_acc.append(get_accuracy_small(model, batch_size)) # compute training accuracy 
            n += 1
        print(("Epoch {}: Train acc: {}").format(
                epoch + 1,
                train_acc[-1]))
    print('Finished Training')
    end_time = time.time()
    elapsed_time = end_time - start_time
    print("Total time elapsed: {:.2f} seconds".format(elapsed_time))

    # Plotting
    plt.title("Training Curve")
    plt.plot(iters, losses, label="Train")
    plt.xlabel("Iterations")
    plt.ylabel("Loss")
    plt.show()

    plt.title("Training Curve")
    plt.plot(iters, train_acc, label="Train")
    plt.xlabel("Iterations")
    plt.ylabel("Training Accuracy")
    plt.legend(loc='best')
    plt.show()

    print("Final Training Accuracy: {}".format(train_acc[-1]))


use_cuda = True

model = CNN()

if use_cuda and torch.cuda.is_available():
  model.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')
  
train_small(model, small_data, num_epochs=100)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.1111111111111111
Epoch 2: Train acc: 0.1111111111111111
Epoch 3: Train acc: 0.1111111111111111
Epoch 4: Train acc: 0.1111111111111111
Epoch 5: Train acc: 0.1111111111111111
Epoch 6: Train acc: 0.1111111111111111
Epoch 7: Train acc: 0.1111111111111111
Epoch 8: Train acc: 0.1111111111111111
Epoch 9: Train acc: 0.1111111111111111
Epoch 10: Train acc: 0.1111111111111111
Epoch 11: Train acc: 0.1111111111111111
Epoch 12: Train acc: 0.1111111111111111
Epoch 13: Train acc: 0.1111111111111111
Epoch 14: Train acc: 0.1111111111111111
Epoch 15: Train acc: 0.1111111111111111
Epoch 16: Train acc: 0.1111111111111111
Epoch 17: Train acc: 0.1111111111111111
Epoch 18: Train acc: 0.1111111111111111
Epoch 19: Train acc: 0.1111111111111111
Epoch 20: Train acc: 0.1111111111111111
Epoch 21: Train acc: 0.1111111111111111
Epoch 22: Train acc: 0.1111111111111111
Epoch 23: Train acc: 0.1111111111111111
Epoch 24: Train acc: 0.1111111111111111
Epoch 25: Train acc: 0.1111111111111111
Epoch 26: Train acc: 0.1111111111111111
Epoch 27: Train acc: 0.1111111111111111
Epoch 28: Train acc: 0.1111111111111111
Epoch 29: Train acc: 0.14814814814814814
Epoch 30: Train acc: 0.14814814814814814
Epoch 31: Train acc: 0.14814814814814814
Epoch 32: Train acc: 0.14814814814814814
Epoch 33: Train acc: 0.14814814814814814
Epoch 34: Train acc: 0.14814814814814814
Epoch 35: Train acc: 0.14814814814814814
Epoch 36: Train acc: 0.14814814814814814
Epoch 37: Train acc: 0.14814814814814814
Epoch 38: Train acc: 0.14814814814814814
Epoch 39: Train acc: 0.18518518518518517
Epoch 40: Train acc: 0.18518518518518517
Epoch 41: Train acc: 0.18518518518518517
Epoch 42: Train acc: 0.2222222222222222
Epoch 43: Train acc: 0.2222222222222222
Epoch 44: Train acc: 0.2962962962962963
Epoch 45: Train acc: 0.2962962962962963
Epoch 46: Train acc: 0.2962962962962963
Epoch 47: Train acc: 0.2962962962962963
Epoch 48: Train acc: 0.2962962962962963
Epoch 49: Train acc: 0.2962962962962963
Epoch 50: Train acc: 0.3333333333333333
Epoch 51: Train acc: 0.3333333333333333
Epoch 52: Train acc: 0.4444444444444444
Epoch 53: Train acc: 0.5185185185185185
Epoch 54: Train acc: 0.5555555555555556
Epoch 55: Train acc: 0.5925925925925926
Epoch 56: Train acc: 0.6296296296296297
Epoch 57: Train acc: 0.6296296296296297
Epoch 58: Train acc: 0.5555555555555556
Epoch 59: Train acc: 0.5925925925925926
Epoch 60: Train acc: 0.5925925925925926
Epoch 61: Train acc: 0.6296296296296297
Epoch 62: Train acc: 0.6296296296296297
Epoch 63: Train acc: 0.6666666666666666
Epoch 64: Train acc: 0.6666666666666666
Epoch 65: Train acc: 0.6666666666666666
Epoch 66: Train acc: 0.6666666666666666
Epoch 67: Train acc: 0.6666666666666666
Epoch 68: Train acc: 0.6666666666666666
Epoch 69: Train acc: 0.6666666666666666
Epoch 70: Train acc: 0.6666666666666666
Epoch 71: Train acc: 0.6666666666666666
Epoch 72: Train acc: 0.6666666666666666
Epoch 73: Train acc: 0.7037037037037037
Epoch 74: Train acc: 0.8148148148148148
Epoch 75: Train acc: 0.8518518518518519
Epoch 76: Train acc: 0.8518518518518519
Epoch 77: Train acc: 0.8888888888888888
Epoch 78: Train acc: 0.9259259259259259
Epoch 79: Train acc: 0.9629629629629629
Epoch 80: Train acc: 0.9629629629629629
Epoch 81: Train acc: 0.9629629629629629
Epoch 82: Train acc: 1.0
Epoch 83: Train acc: 1.0
Epoch 84: Train acc: 1.0
Epoch 85: Train acc: 1.0
Epoch 86: Train acc: 1.0
Epoch 87: Train acc: 1.0
Epoch 88: Train acc: 1.0
Epoch 89: Train acc: 1.0
Epoch 90: Train acc: 1.0
Epoch 91: Train acc: 1.0
Epoch 92: Train acc: 1.0
Epoch 93: Train acc: 1.0
Epoch 94: Train acc: 1.0
Epoch 95: Train acc: 1.0
Epoch 96: Train acc: 1.0
Epoch 97: Train acc: 1.0
Epoch 98: Train acc: 1.0
Epoch 99: Train acc: 1.0
Epoch 100: Train acc: 1.0
Finished Training
Total time elapsed: 18.27 seconds

Final Training Accuracy: 1.0


use_cuda = True

model_1 = CNN()

if use_cuda and torch.cuda.is_available():
  model_1.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')

train(model_1, train_data)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.32321428571428573 |Validation acc: 0.2991202346041056
Epoch 2: Train acc: 0.6042207792207792 |Validation acc: 0.5674486803519062
Epoch 3: Train acc: 0.6761363636363636 |Validation acc: 0.6451612903225806
Epoch 4: Train acc: 0.7417207792207792 |Validation acc: 0.7067448680351907
Epoch 5: Train acc: 0.7597402597402597 |Validation acc: 0.7331378299120235
Epoch 6: Train acc: 0.763474025974026 |Validation acc: 0.7463343108504399
Epoch 7: Train acc: 0.8051948051948052 |Validation acc: 0.7448680351906158
Epoch 8: Train acc: 0.813474025974026 |Validation acc: 0.7551319648093842
Epoch 9: Train acc: 0.7553571428571428 |Validation acc: 0.7023460410557185
Epoch 10: Train acc: 0.8292207792207792 |Validation acc: 0.7609970674486803
Epoch 11: Train acc: 0.8579545454545454 |Validation acc: 0.7991202346041055
Epoch 12: Train acc: 0.8392857142857143 |Validation acc: 0.7653958944281525
Epoch 13: Train acc: 0.8912337662337663 |Validation acc: 0.8137829912023461
Epoch 14: Train acc: 0.8964285714285715 |Validation acc: 0.7873900293255132
Epoch 15: Train acc: 0.850487012987013 |Validation acc: 0.7653958944281525
Epoch 16: Train acc: 0.9038961038961039 |Validation acc: 0.8284457478005866
Epoch 17: Train acc: 0.902435064935065 |Validation acc: 0.8079178885630498
Epoch 18: Train acc: 0.9152597402597402 |Validation acc: 0.8211143695014663
Epoch 19: Train acc: 0.9201298701298701 |Validation acc: 0.8196480938416423
Epoch 20: Train acc: 0.9086038961038961 |Validation acc: 0.8064516129032258
Epoch 21: Train acc: 0.9055194805194805 |Validation acc: 0.7947214076246334
Epoch 22: Train acc: 0.900487012987013 |Validation acc: 0.7947214076246334
Epoch 23: Train acc: 0.9313311688311688 |Validation acc: 0.8064516129032258
Epoch 24: Train acc: 0.9321428571428572 |Validation acc: 0.7991202346041055
Epoch 25: Train acc: 0.9415584415584416 |Validation acc: 0.8123167155425219
Epoch 26: Train acc: 0.9336038961038962 |Validation acc: 0.7961876832844574
Epoch 27: Train acc: 0.9454545454545454 |Validation acc: 0.8167155425219942
Epoch 28: Train acc: 0.9451298701298702 |Validation acc: 0.8181818181818182
Epoch 29: Train acc: 0.9587662337662337 |Validation acc: 0.8093841642228738
Epoch 30: Train acc: 0.962012987012987 |Validation acc: 0.8152492668621701
Finished Training
Total time elapsed: 1307.40 seconds

Final Training Accuracy: 0.962012987012987
Final Validation Accuracy: 0.8152492668621701


use_cuda = True

model_2 = CNN()

if use_cuda and torch.cuda.is_available():
  model_2.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')

train(model_2, train_data, batch_size=270)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.15438311688311687 |Validation acc: 0.15102639296187684
Epoch 2: Train acc: 0.19886363636363635 |Validation acc: 0.19208211143695014
Epoch 3: Train acc: 0.23262987012987013 |Validation acc: 0.22140762463343108
Epoch 4: Train acc: 0.4314935064935065 |Validation acc: 0.41348973607038125
Epoch 5: Train acc: 0.5025974025974026 |Validation acc: 0.4706744868035191
Epoch 6: Train acc: 0.6108766233766234 |Validation acc: 0.5850439882697948
Epoch 7: Train acc: 0.6772727272727272 |Validation acc: 0.6466275659824047
Epoch 8: Train acc: 0.6931818181818182 |Validation acc: 0.6876832844574781
Epoch 9: Train acc: 0.7397727272727272 |Validation acc: 0.7111436950146628
Epoch 10: Train acc: 0.7477272727272727 |Validation acc: 0.7331378299120235
Epoch 11: Train acc: 0.7618506493506494 |Validation acc: 0.7331378299120235
Epoch 12: Train acc: 0.7797077922077922 |Validation acc: 0.7609970674486803
Epoch 13: Train acc: 0.7714285714285715 |Validation acc: 0.7565982404692082
Epoch 14: Train acc: 0.7917207792207792 |Validation acc: 0.7565982404692082
Epoch 15: Train acc: 0.8025974025974026 |Validation acc: 0.7551319648093842
Epoch 16: Train acc: 0.8017857142857143 |Validation acc: 0.7434017595307918
Epoch 17: Train acc: 0.8066558441558441 |Validation acc: 0.7756598240469208
Epoch 18: Train acc: 0.7920454545454545 |Validation acc: 0.7595307917888563
Epoch 19: Train acc: 0.826948051948052 |Validation acc: 0.7653958944281525
Epoch 20: Train acc: 0.8063311688311688 |Validation acc: 0.7565982404692082
Epoch 21: Train acc: 0.8235389610389611 |Validation acc: 0.7609970674486803
Epoch 22: Train acc: 0.8334415584415584 |Validation acc: 0.7756598240469208
Epoch 23: Train acc: 0.8428571428571429 |Validation acc: 0.7800586510263929
Epoch 24: Train acc: 0.8431818181818181 |Validation acc: 0.7741935483870968
Epoch 25: Train acc: 0.8498376623376623 |Validation acc: 0.7903225806451613
Epoch 26: Train acc: 0.8449675324675324 |Validation acc: 0.7683284457478006
Epoch 27: Train acc: 0.8599025974025974 |Validation acc: 0.7888563049853372
Epoch 28: Train acc: 0.8717532467532467 |Validation acc: 0.7903225806451613
Epoch 29: Train acc: 0.861525974025974 |Validation acc: 0.7771260997067448
Epoch 30: Train acc: 0.8733766233766234 |Validation acc: 0.7888563049853372
Finished Training
Total time elapsed: 1488.61 seconds

Final Training Accuracy: 0.8733766233766234
Final Validation Accuracy: 0.7888563049853372


class updated_CNN(nn.Module):
    def __init__(self):
        super(updated_CNN, self).__init__()
        self.name = "updated_cnn"
        self.conv1 = nn.Conv2d(3, 5, 3, stride=2, padding=1)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(5, 5, 7, stride=2, padding=1)
        self.fc1 = nn.Linear(5 * 13 * 13, 32)
        self.fc2 = nn.Linear(32, 9)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = x.view(-1, 5 * 13 * 13)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        x = x.squeeze(1) # Flatten to [batch_size]
        return x


use_cuda = True

model_3 = updated_CNN()

if use_cuda and torch.cuda.is_available():
  model_3.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')

train(model_3, train_data, batch_size=27)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.1564935064935065 |Validation acc: 0.1436950146627566
Epoch 2: Train acc: 0.36704545454545456 |Validation acc: 0.3284457478005865
Epoch 3: Train acc: 0.5657467532467533 |Validation acc: 0.5087976539589443
Epoch 4: Train acc: 0.649512987012987 |Validation acc: 0.6143695014662757
Epoch 5: Train acc: 0.6836038961038962 |Validation acc: 0.6627565982404692
Epoch 6: Train acc: 0.7133116883116883 |Validation acc: 0.6774193548387096
Epoch 7: Train acc: 0.7439935064935065 |Validation acc: 0.7008797653958945
Epoch 8: Train acc: 0.7573051948051948 |Validation acc: 0.7199413489736071
Epoch 9: Train acc: 0.7459415584415584 |Validation acc: 0.7126099706744868
Epoch 10: Train acc: 0.8017857142857143 |Validation acc: 0.7712609970674487
Epoch 11: Train acc: 0.8180194805194805 |Validation acc: 0.782991202346041
Epoch 12: Train acc: 0.8112012987012988 |Validation acc: 0.7947214076246334
Epoch 13: Train acc: 0.7996753246753247 |Validation acc: 0.7727272727272727
Epoch 14: Train acc: 0.8511363636363637 |Validation acc: 0.8152492668621701
Epoch 15: Train acc: 0.8217532467532468 |Validation acc: 0.7859237536656891
Epoch 16: Train acc: 0.8469155844155845 |Validation acc: 0.8108504398826979
Epoch 17: Train acc: 0.8618506493506494 |Validation acc: 0.8152492668621701
Epoch 18: Train acc: 0.8625 |Validation acc: 0.8343108504398827
Epoch 19: Train acc: 0.8668831168831169 |Validation acc: 0.8284457478005866
Epoch 20: Train acc: 0.8586038961038961 |Validation acc: 0.8299120234604106
Epoch 21: Train acc: 0.865909090909091 |Validation acc: 0.8196480938416423
Epoch 22: Train acc: 0.850487012987013 |Validation acc: 0.8064516129032258
Epoch 23: Train acc: 0.8813311688311688 |Validation acc: 0.8548387096774194
Epoch 24: Train acc: 0.8926948051948052 |Validation acc: 0.8504398826979472
Epoch 25: Train acc: 0.8823051948051948 |Validation acc: 0.8475073313782991
Epoch 26: Train acc: 0.8930194805194805 |Validation acc: 0.8519061583577713
Epoch 27: Train acc: 0.8936688311688312 |Validation acc: 0.843108504398827
Epoch 28: Train acc: 0.9008116883116883 |Validation acc: 0.8709677419354839
Epoch 29: Train acc: 0.900974025974026 |Validation acc: 0.8577712609970675
Epoch 30: Train acc: 0.9176948051948052 |Validation acc: 0.8548387096774194
Finished Training
Total time elapsed: 1280.51 seconds

Final Training Accuracy: 0.9176948051948052
Final Validation Accuracy: 0.8548387096774194


use_cuda = True

model_4 = updated_CNN()

if use_cuda and torch.cuda.is_available():
  model_4.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')

train(model_4, train_data, batch_size=270)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.0836038961038961 |Validation acc: 0.08357771260997067
Epoch 2: Train acc: 0.09366883116883117 |Validation acc: 0.07917888563049853
Epoch 3: Train acc: 0.10113636363636364 |Validation acc: 0.08944281524926687
Epoch 4: Train acc: 0.1185064935064935 |Validation acc: 0.12023460410557185
Epoch 5: Train acc: 0.13133116883116883 |Validation acc: 0.12316715542521994
Epoch 6: Train acc: 0.13587662337662337 |Validation acc: 0.1378299120234604
Epoch 7: Train acc: 0.14545454545454545 |Validation acc: 0.14076246334310852
Epoch 8: Train acc: 0.14772727272727273 |Validation acc: 0.14516129032258066
Epoch 9: Train acc: 0.15487012987012988 |Validation acc: 0.15395894428152493
Epoch 10: Train acc: 0.1719155844155844 |Validation acc: 0.15689149560117302
Epoch 11: Train acc: 0.1943181818181818 |Validation acc: 0.17595307917888564
Epoch 12: Train acc: 0.24594155844155843 |Validation acc: 0.1935483870967742
Epoch 13: Train acc: 0.3146103896103896 |Validation acc: 0.24926686217008798
Epoch 14: Train acc: 0.36347402597402595 |Validation acc: 0.29765395894428154
Epoch 15: Train acc: 0.4108766233766234 |Validation acc: 0.3592375366568915
Epoch 16: Train acc: 0.4474025974025974 |Validation acc: 0.39002932551319647
Epoch 17: Train acc: 0.5212662337662337 |Validation acc: 0.4472140762463343
Epoch 18: Train acc: 0.5685064935064935 |Validation acc: 0.5
Epoch 19: Train acc: 0.5873376623376624 |Validation acc: 0.5410557184750733
Epoch 20: Train acc: 0.6277597402597402 |Validation acc: 0.593841642228739
Epoch 21: Train acc: 0.6563311688311688 |Validation acc: 0.6539589442815249
Epoch 22: Train acc: 0.6702922077922078 |Validation acc: 0.6612903225806451
Epoch 23: Train acc: 0.6821428571428572 |Validation acc: 0.6700879765395894
Epoch 24: Train acc: 0.6915584415584416 |Validation acc: 0.6759530791788856
Epoch 25: Train acc: 0.7064935064935065 |Validation acc: 0.7008797653958945
Epoch 26: Train acc: 0.7082792207792208 |Validation acc: 0.7111436950146628
Epoch 27: Train acc: 0.7147727272727272 |Validation acc: 0.7052785923753666
Epoch 28: Train acc: 0.7238636363636364 |Validation acc: 0.717008797653959
Epoch 29: Train acc: 0.7214285714285714 |Validation acc: 0.7360703812316716
Epoch 30: Train acc: 0.7314935064935065 |Validation acc: 0.7214076246334311
Finished Training
Total time elapsed: 1432.33 seconds

Final Training Accuracy: 0.7314935064935065
Final Validation Accuracy: 0.7214076246334311


def get_test_accuracy(model, batch_size):
    data = test_data
    correct = 0
    total = 0
    for imgs, labels in torch.utils.data.DataLoader(data, batch_size=batch_size):
        
        
        #############################################
        # To Enable GPU Usage
        if use_cuda and torch.cuda.is_available():
          imgs = imgs.cuda()
          labels = labels.cuda()
        #############################################

        
        output = model(imgs)
        
        # Select index with maximum prediction score
        pred = output.max(1, keepdim=True)[1]
        correct += pred.eq(labels.view_as(pred)).sum().item()
        total += imgs.shape[0]
    return correct / total


test_acc = get_test_accuracy(model_3, batch_size=27)
print("The test accuracy is", test_acc*100, "%.")

The test accuracy is 86.73740053050398 %.


import torchvision.models
alexnet = torchvision.models.alexnet(pretrained=True)


classes = ['A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I']

def get_feature(data):
    if data == "train":
        data_loader = torch.utils.data.DataLoader(train_data, batch_size=1, shuffle=True)
    elif data == "val":
        data_loader = torch.utils.data.DataLoader(val_data, batch_size=1, shuffle=True)
    else:
        data_loader = torch.utils.data.DataLoader(test_data, batch_size=1, shuffle=True)
    n = 0
    for imgs, labels in iter(data_loader):
        features = alexnet.features(imgs)
        features_tensor = torch.from_numpy(features.detach().numpy())
        torch.save(features_tensor.squeeze(0), './AlexNet Features/' + data + '/' + classes[labels] + '/' + 'feature_bs1_' + str(n) + '.tensor')
        n += 1


get_feature("train")
get_feature("val")
get_feature("test")


# features = ... load precomputed alexnet.features(img) ...
output = model(features)
prob = F.softmax(output)


class transfer_CNN(nn.Module):
    def __init__(self):
        super(transfer_CNN, self).__init__()
        self.name = "transfer_cnn"
        self.conv1 = nn.Conv2d(256, 256, 3, padding=1)
        self.pool = nn.MaxPool2d(2, 2)
        self.fc1 = nn.Linear(256 * 3 * 3, 32)
        self.fc2 = nn.Linear(32, 9)

    def forward(self, x):
        x = self.pool(F.relu(self.conv1(x)))
        x = x.view(-1, 256 * 3 * 3)
        x = F.relu(self.fc1(x))
        x = self.fc2(x)
        x = x.squeeze(1) # Flatten to [batch_size]
        return x


train_data_alexnet = torchvision.datasets.DatasetFolder('./AlexNet Features/train', loader=torch.load, extensions=('.tensor'))
val_data_alexnet = torchvision.datasets.DatasetFolder('./AlexNet Features/val', loader=torch.load, extensions=('.tensor'))
test_data_alexnet = torchvision.datasets.DatasetFolder('./AlexNet Features/test', loader=torch.load, extensions=('.tensor'))


def get_accuracy_transfer(model, batch_size, train=False):
    if train:
        data = train_data_alexnet
    else:
        data = val_data_alexnet
    correct = 0
    total = 0
    for imgs, labels in torch.utils.data.DataLoader(data, batch_size=batch_size):
        
        
        #############################################
        # To Enable GPU Usage
        if use_cuda and torch.cuda.is_available():
          imgs = imgs.cuda()
          labels = labels.cuda()
        #############################################

        
        output = model(imgs)
        
        # Select index with maximum prediction score
        pred = output.max(1, keepdim=True)[1]
        correct += pred.eq(labels.view_as(pred)).sum().item()
        total += imgs.shape[0]
    return correct / total


def transfer_train(model, data, batch_size=64, learning_rate=0.001, num_epochs=30):
    torch.manual_seed(1000)
    train_loader = torch.utils.data.DataLoader(data, batch_size=batch_size, shuffle=True)
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.SGD(model.parameters(), lr=learning_rate, momentum=0.9)

    iters, losses, train_acc, val_acc = [], [], [], []

    # Training
    start_time = time.time()
    n = 0 # the number of iterations
    for epoch in range(num_epochs):
        for imgs, labels in iter(train_loader):
          
          
            #############################################
            # To Enable GPU Usage
            if use_cuda and torch.cuda.is_available():
              imgs = imgs.cuda()
              labels = labels.cuda()
            #############################################
            
              
            out = model(imgs)             # forward pass
            loss = criterion(out, labels) # compute the total loss
            loss.backward()               # backward pass (compute parameter updates)
            optimizer.step()              # make the updates for each parameter
            optimizer.zero_grad()         # a clean up step for PyTorch

            # Save the current training information
            iters.append(n)
            losses.append(float(loss)/batch_size)             # compute *average* loss
            n += 1
        train_acc.append(get_accuracy_transfer(model, batch_size=batch_size, train=True)) # compute training accuracy 
        val_acc.append(get_accuracy_transfer(model, batch_size=batch_size, train=False))  # compute validation accuracy
        print(("Epoch {}: Train acc: {} |"+"Validation acc: {}").format(
                epoch + 1,
                train_acc[-1],
                val_acc[-1]))
        # Save the current model (checkpoint) to a file
        model_path = get_model_name(model.name, batch_size, learning_rate, epoch)
        torch.save(model.state_dict(), model_path)
    print('Finished Training')
    end_time = time.time()
    elapsed_time = end_time - start_time
    print("Total time elapsed: {:.2f} seconds".format(elapsed_time))

    # Plotting
    plt.title("Training Curve")
    plt.plot(iters, losses, label="Train")
    plt.xlabel("Iterations")
    plt.ylabel("Loss")
    plt.show()

    plt.title("Training Curve")
    plt.plot(range(1 ,num_epochs+1), train_acc, label="Train")
    plt.plot(range(1 ,num_epochs+1), val_acc, label="Validation")
    plt.xlabel("Epochs")
    plt.ylabel("Training Accuracy")
    plt.legend(loc='best')
    plt.show()

    print("Final Training Accuracy: {}".format(train_acc[-1]))
    print("Final Validation Accuracy: {}".format(val_acc[-1]))


use_cuda = True

transfer_model = transfer_CNN()

if use_cuda and torch.cuda.is_available():
  transfer_model.cuda()
  print('CUDA is available!  Training on GPU ...')
else:
  print('CUDA is not available.  Training on CPU ...')

transfer_train(transfer_model, train_data_alexnet, batch_size=27, num_epochs=10)

CUDA is available!  Training on GPU ...
Epoch 1: Train acc: 0.8449675324675324 |Validation acc: 0.8592375366568915
Epoch 2: Train acc: 0.9170454545454545 |Validation acc: 0.9032258064516129
Epoch 3: Train acc: 0.9438311688311688 |Validation acc: 0.9281524926686217
Epoch 4: Train acc: 0.9564935064935065 |Validation acc: 0.9281524926686217
Epoch 5: Train acc: 0.9688311688311688 |Validation acc: 0.9457478005865103
Epoch 6: Train acc: 0.9775974025974026 |Validation acc: 0.9472140762463344
Epoch 7: Train acc: 0.9826298701298701 |Validation acc: 0.9589442815249267
Epoch 8: Train acc: 0.976461038961039 |Validation acc: 0.9457478005865103
Epoch 9: Train acc: 0.986525974025974 |Validation acc: 0.9574780058651027
Epoch 10: Train acc: 0.9913961038961039 |Validation acc: 0.9633431085043989
Finished Training
Total time elapsed: 129.52 seconds

Final Training Accuracy: 0.9913961038961039
Final Validation Accuracy: 0.9633431085043989


def get_transfer_test_accuracy(model, batch_size):
    data = test_data_alexnet
    correct = 0
    total = 0
    for imgs, labels in torch.utils.data.DataLoader(data, batch_size=batch_size):
        
        
        #############################################
        # To Enable GPU Usage
        if use_cuda and torch.cuda.is_available():
          imgs = imgs.cuda()
          labels = labels.cuda()
        #############################################

        
        output = model(imgs)
        
        # Select index with maximum prediction score
        pred = output.max(1, keepdim=True)[1]
        correct += pred.eq(labels.view_as(pred)).sum().item()
        total += imgs.shape[0]
    return correct / total


test_acc = get_transfer_test_accuracy(transfer_model, batch_size=27)
print("The test accuracy is", test_acc*100, "%.")

The test accuracy is 94.29708222811671 %.

Lab 3: Gesture Recognition using Convolutional Neural Networks¶

What to submit¶

Colab Link¶

Part A. Data Collection [10 pt]¶

American Sign Language¶

Generating Data¶

Cleaning Data¶

Accepted Images¶

Submission¶

Part B. Building a CNN [50 pt]¶

1. Data Loading and Splitting [10 pt]¶

2. Model Building and Sanity Checking [15 pt]¶

Part (a) Convolutional Network - 5 pt¶

Part (b) Training Code - 5 pt¶

Part (c) “Overfit” to a Small Dataset - 5 pt¶

3. Hyperparameter Search [10 pt]¶

Part (a) - 1 pt¶

Part (b) - 5 pt¶

Part (c) - 2 pt¶

Part (d) - 2 pt¶

4. Transfer Learning [15 pt]¶

Part (a) - 5 pt¶

Part (b) - 3 pt¶

Part (c) - 5 pt¶

Part (d) - 2 pt¶