Notebook 1 - Getting Started with PyTorch on Colab¶

Basic Colab Usage¶

Colab is a service from Google that provides access to computing resources (like GPUs) useful for training and running neural networks. A Colab notebook consists of:

  • Code cells, which accept:
      • Ordinary Python code
      • Unix/Linux-style bash commands - these must be preceded by an exclamation mark: !command-name arguments...
      • Notebook-specific "magic commands" - these must be preceded by a percent sign: %command-name arguments...
  • Text (markdown) cells
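
For example, a single code cell can mix all three (a small illustration - the specific commands here are arbitrary):

In [ ]:
print('ordinary Python')  # ordinary Python code
!ls /content              # bash command: list files in Colab's working directory
%time sum(range(10**6))   # magic command: time a Python expression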

Importantly, we can set the runtime type using the Runtime menu at the top of the notebook:

Runtime > Change runtime type > T4 GPU

will give you access to a cheap GPU. Feel free to do this.

You can also check your CPU, Disk, and GPU memory usage in the upper right corner; click the box that says RAM and Disk.
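
If you've selected a GPU runtime, you can also confirm that a GPU is attached from a code cell (nvidia-smi is NVIDIA's standard GPU monitoring utility and is available on Colab GPU runtimes):

In [ ]:
!nvidia-smi # shows the attached GPU and its current memory usage (GPU runtimes only)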

The following cells can be used to check what Python version Colab is using.

Unfortunately, the Python version used by bash commands can disagree with the version used by Python cells. This won't be an issue unless you work with virtual environments or try to change versions.

If you decide to change versions or use venvs for any reason, be careful!

In [ ]:
!python --version # check what version of Python bash commands use
In [ ]:
import sys # check what version of Python the Python cells use
sys.version

In this notebook, we'll need to use the deep learning library PyTorch.

We can ensure it is installed (or install it if it isn't) using the package manager pip. To be safe, use pip3 in most cases - this ensures you are installing packages for use with Python 3.

We will also use google.colab, which of course is pre-installed in Colab environments.

In [ ]:
!pip3 show torch # check that torch is installed - it should be!

If at any point another package/library is needed and Colab throws an error because it isn't installed, use !pip3 install package-name.
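
For example (package-name is just a placeholder - substitute whatever package the error message says is missing):

In [ ]:
!pip3 install package-name # replace package-name with the missing package before running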

Mounting your Google Drive¶

Colab allows you to access your files via Google Drive. This is useful when working with large datasets. Simply store them in a drive you have access to and you'll never have to download them again!

Let's see how:

In [ ]:
# Mount your Google Drive - will show up in the folder 'drive'
from google.colab import drive
drive.mount('/content/drive') # this line will produce a pop-up

You can check the contents of your Drive as follows. You can also use the icon that looks like a folder on the left-hand side of the screen.

In [ ]:
# List the contents of your Google Drive.
!ls "/content/drive/My Drive/"

Data¶

Before we get into PyTorch, we should load up some data so we have something to actually learn from.

An easy-to-use dataset is the Iris dataset, which consists of a set of measurements taken of many iris flowers paired with the flowers' species. It is readily available from sklearn.

In [5]:
from sklearn.datasets import load_iris

data = load_iris()
data['data'].shape, data['target'].shape
Out[5]:
((150, 4), (150,))

sklearn formats the Iris dataset as two arrays.

The first, called 'data', contains 150 rows and 4 columns. This is meant to be interpreted as 150 samples or instances of data, with each having 4 features (sepal length, sepal width, petal length, petal width):

In [6]:
print(data['data'].shape)
data['data'][:5] # look at 5 iris' measurements
(150, 4)
Out[6]:
array([[5.1, 3.5, 1.4, 0.2],
       [4.9, 3. , 1.4, 0.2],
       [4.7, 3.2, 1.3, 0.2],
       [4.6, 3.1, 1.5, 0.2],
       [5. , 3.6, 1.4, 0.2]])

The second, called 'target', is a single vector of 150 entries, which we can interpret as 150 rows and 1 column. Each entry is the class label for the corresponding 4-feature input, and there are three classes (0 for Setosa, 1 for Versicolour, 2 for Virginica):

In [7]:
print('instances:', data['target'].shape)
print('number of unique classes:', len(set(data['target'])))
data['target'][:5] # first 5 are all class 0 (Setosa)
instances: (150,)
number of unique classes: 3
Out[7]:
array([0, 0, 0, 0, 0])

Great! Let's try and pass the data through a neural net!

Writing a model¶

PyTorch is used to build, train, and run deep neural networks. Because the nn (neural network) and nn.functional (common mathematical functions used in neural networks) submodules are used so often, it is common practice to do the following:

In [8]:
import torch
from torch import nn
from torch.nn import functional as F

Let's build a simple neural network and try to complete a forward pass. In PyTorch, a neural network:

  • must be a Python class
  • must subclass (inherit from) torch.nn.Module
  • must have an __init__() method (a constructor), in which ALL trainable model parameters are defined
  • must have a forward() method that defines the behavior of the model (how an input is passed through the layers)
In [9]:
class Net(nn.Module):
    def __init__(self):

        # do whatever must be done for an nn.Module
        super(Net, self).__init__()

        # 4D input, 3D output
        self.linear = nn.Linear(4, 3)

    def forward(self, x):

        # just pass the input through the linear layer
        return self.linear(x)

This is a very simple neural network. In fact, it's hard to even call it a neural network because it is not deep - it has only one layer. This is commonly called a linear model.

Nonetheless, let's try to see what it looks like. I'm going to add a seed as well, so that we all get the same numbers every time (reproducibility):

In [10]:
torch.manual_seed(42)

model = Net() # make an instance of the Net class we just wrote
model # take a look
Out[10]:
Net(
  (linear): Linear(in_features=4, out_features=3, bias=True)
)

4 input features, 3 output features. How many parameters?

In [11]:
s = 0

# iterate over model's parameters
for name, param in model.named_parameters():
    print(name, param.shape)
    print(param, '\n\n\n')
    s += param.numel() # count elements in a tensor
print('total parameters:', s)
linear.weight torch.Size([3, 4])
Parameter containing:
tensor([[ 0.3823,  0.4150, -0.1171,  0.4593],
        [-0.1096,  0.1009, -0.2434,  0.2936],
        [ 0.4408, -0.3668,  0.4346,  0.0936]], requires_grad=True) 



linear.bias torch.Size([3])
Parameter containing:
tensor([0.3694, 0.0677, 0.2411], requires_grad=True) 



total parameters: 15

We have 15 parameters, including the bias terms. This model represents what's called an affine transformation (one that takes an input like $\mathbf{x}$ and maps it to $W\mathbf{x}+\mathbf{b}$):

$$ W\mathbf{x} + \mathbf{b} = \hat{\mathbf{y}} $$

$$ \begin{bmatrix} 0.3823 & 0.4150 & -0.1171 & 0.4593 \\ -0.1096 & 0.1009 & -0.2434 & 0.2936 \\ 0.4408 & -0.3668 & 0.4346 & 0.0936 \\ \end{bmatrix} \begin{bmatrix} x_1 \\ x_2 \\ x_3 \\ x_4 \\ \end{bmatrix} + \begin{bmatrix} 0.3694 \\ 0.0677 \\ 0.2411 \\ \end{bmatrix} = \begin{bmatrix} \hat{y}_1 \\ \hat{y}_2 \\ \hat{y}_3 \\ \end{bmatrix} $$

Alternatively, we can let the first column of $W$ be the bias vector, and assign $\mathbf{x}$ a dummy feature in its first slot which is always 1:

$$ W\mathbf{x} = \hat{\mathbf{y}} $$

$$ \begin{bmatrix} 0.3694 & 0.3823 & 0.4150 & -0.1171 & 0.4593 \\ 0.0677 & -0.1096 & 0.1009 & -0.2434 & 0.2936 \\ 0.2411 & 0.4408 & -0.3668 & 0.4346 & 0.0936 \\ \end{bmatrix} \begin{bmatrix} 1 \\ x_1 \\ x_2 \\ x_3 \\ x_4 \\ \end{bmatrix} = \begin{bmatrix} \hat{y}_1 \\ \hat{y}_2 \\ \hat{y}_3 \\ \end{bmatrix} $$
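
We can verify the affine form directly by computing $W\mathbf{x}+\mathbf{b}$ ourselves and comparing it to the model's output (a quick sketch using the seeded model above and the first iris sample):

In [ ]:
x = torch.tensor([5.1, 3.5, 1.4, 0.2]) # first iris sample
W = model.linear.weight                # shape (3, 4)
b = model.linear.bias                  # shape (3,)
print(W @ x + b)                       # the affine transformation, computed by hand
print(model(x))                        # the model's forward pass - same values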

If we wanted to make this model a bit more powerful, it would be smart to (1) have multiple layers and (2) use a non-linearity between them so the model can learn non-linear functions:

In [12]:
class DeepNet(nn.Module):
    def __init__(self):

        # do whatever must be done for an nn.Module
        super(DeepNet, self).__init__()

        # 4D input, 8D hidden layer, 3D output
        self.linear1 = nn.Linear(4, 8) # hidden size 8 is arbitrary
        self.linear2 = nn.Linear(8, 3) # input size must match the previous layer's output size

    def forward(self, x):

        # pass through first layer
        x = self.linear1(x)

        # activation function, ReLU
        x = F.relu(x)

        # pass through second layer
        x = self.linear2(x)

        return x
In [13]:
deep_model = DeepNet()
deep_model
Out[13]:
DeepNet(
  (linear1): Linear(in_features=4, out_features=8, bias=True)
  (linear2): Linear(in_features=8, out_features=3, bias=True)
)
In [14]:
s = 0

# iterate over model's parameters
for name, param in deep_model.named_parameters():
    print(name, param.shape)
    print(param, end='\n\n')
    s += param.numel() # count elements in a tensor
print('total parameters:', s)
linear1.weight torch.Size([8, 4])
Parameter containing:
tensor([[-0.0706,  0.3854,  0.0739, -0.2334],
        [ 0.1274, -0.2304, -0.0586, -0.2031],
        [ 0.3317, -0.3947, -0.2305, -0.1412],
        [-0.3006,  0.0472, -0.4938,  0.4516],
        [-0.4247,  0.3860,  0.0832, -0.1624],
        [ 0.3090,  0.0779,  0.4040,  0.0547],
        [-0.1577,  0.1343, -0.1356,  0.2104],
        [ 0.4464,  0.2890, -0.2186,  0.2886]], requires_grad=True)

linear1.bias torch.Size([8])
Parameter containing:
tensor([ 0.0895,  0.2539, -0.3048, -0.4950, -0.1932, -0.3835,  0.4103,  0.1440],
       requires_grad=True)

linear2.weight torch.Size([3, 8])
Parameter containing:
tensor([[ 0.1464,  0.1118, -0.0062,  0.2767, -0.2512,  0.0223, -0.2413,  0.1090],
        [-0.1218,  0.1083, -0.0737,  0.2932, -0.2096, -0.2109, -0.2109,  0.3180],
        [ 0.1178,  0.3402, -0.2918, -0.3507, -0.2766, -0.2378,  0.1432,  0.1266]],
       requires_grad=True)

linear2.bias torch.Size([3])
Parameter containing:
tensor([ 0.2938, -0.1826, -0.2410], requires_grad=True)

total parameters: 67

Without writing out all the parameters, this model computes:

$$ W_2\sigma(W_1\mathbf{x} + \mathbf{b}_1) + \mathbf{b}_2 = \hat{\mathbf{y}} $$

with:

$$ W_2 \in \mathbb{R}^{3\times8}, \quad W_1 \in \mathbb{R}^{8\times4}, \quad \mathbf{x} \in \mathbb{R}^{4\times1}, \quad \mathbf{b}_1 \in \mathbb{R}^{8\times1}, \quad \mathbf{b}_2 \in \mathbb{R}^{3\times1} $$

Note that an activation function such as ReLU operates element-wise, so $$X\in\mathbb{R}^{m\times n} \implies \sigma(X)\in\mathbb{R}^{m\times n}$$
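
A quick check of that shape-preserving behavior (a sketch - the input here is just random numbers):

In [ ]:
X = torch.randn(8, 4)     # a random matrix
X.shape, F.relu(X).shape  # ReLU is applied element-wise, so the shape is unchanged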

Forward pass¶

Let's start by converting our data to a torch.Tensor. PyTorch operates on these specialized arrays, which are easily constructed from Python lists, numpy.ndarray objects, and the like.

In [15]:
tensor_data = torch.Tensor(data['data'])
print('data shape:', tensor_data.shape)
print('\nsome rows in our data:', tensor_data[50:55], sep='\n')
data shape: torch.Size([150, 4])

some rows in our data:
tensor([[7.0000, 3.2000, 4.7000, 1.4000],
        [6.4000, 3.2000, 4.5000, 1.5000],
        [6.9000, 3.1000, 4.9000, 1.5000],
        [5.5000, 2.3000, 4.0000, 1.3000],
        [6.5000, 2.8000, 4.6000, 1.5000]])

As with other array-like objects, you can slice them to get rows or columns.
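
For example (a small sketch):

In [ ]:
print(tensor_data[0])         # first row: one flower's 4 measurements
print(tensor_data[:, 0][:5])  # first column: sepal length, first 5 entries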

Now let's try and pass a single row through the DeepNet:

In [16]:
 # calling a model calls its forward() method
input_tensor = tensor_data[50]
output_tensor = deep_model(input_tensor)
print('input:', input_tensor, sep='\n')
print('input shape:', input_tensor.shape, end='\n\n')
print('output:', output_tensor, sep='\n')
print('output shape:', output_tensor.shape)
print('\nprediction:', output_tensor.argmax().item())
print('    target:', data['target'][50])
input:
tensor([7.0000, 3.2000, 4.7000, 1.4000])
input shape: torch.Size([4])

output:
tensor([ 0.8965,  0.0052, -0.6412], grad_fn=<ViewBackward0>)
output shape: torch.Size([3])

prediction: 0
    target: 1

We can also pass many rows through at once by batching:

In [17]:
batched_input_tensor = tensor_data[50:55]
batched_output_tensor = deep_model(batched_input_tensor)
print('input:', batched_input_tensor, sep='\n')
print('input shape:', batched_input_tensor.shape, end='\n\n')
print('output:', batched_output_tensor, sep='\n')
print('output shape:', batched_output_tensor.shape)
print('\nprediction:', batched_output_tensor.argmax(dim=1).numpy())
print('    target:', data['target'][50:55])
input:
tensor([[7.0000, 3.2000, 4.7000, 1.4000],
        [6.4000, 3.2000, 4.5000, 1.5000],
        [6.9000, 3.1000, 4.9000, 1.5000],
        [5.5000, 2.3000, 4.0000, 1.3000],
        [6.5000, 2.8000, 4.6000, 1.5000]])
input shape: torch.Size([5, 4])

output:
tensor([[ 0.8965,  0.0052, -0.6412],
        [ 0.8701, -0.0025, -0.6034],
        [ 0.8821, -0.0281, -0.6684],
        [ 0.7510, -0.0449, -0.5795],
        [ 0.8383, -0.0217, -0.6428]], grad_fn=<AddmmBackward0>)
output shape: torch.Size([5, 3])

prediction: [0 0 0 0 0]
    target: [1 1 1 1 1]

Our model predicts 0 for everything, but it should predict 1 for these flowers - what's wrong? Nothing is broken: the model's weights are still their random initial values, so it hasn't learned anything yet.

Let's supply some trained weights:

In [ ]:
trained_weights_path = 'path/to/model/iris_model.pt'

deep_model.load_state_dict(
    torch.load(trained_weights_path)
)
batched_output_tensor = deep_model(batched_input_tensor)
print('prediction:', batched_output_tensor.argmax(dim=1).numpy())
print('    target:', data['target'][50:55])

Hardware considerations¶

Deep learning is computationally expensive. As such, it's good to be mindful of choices that will reduce your computational expense for financial, environmental, and efficiency reasons.

One way to speed things up is to use a GPU.

GPUs are designed to perform vectorized linear algebra computations on arrays of numbers. These computations can be done much more efficiently than on a CPU. To take advantage of this, we must put all relevant objects on the GPU. This can be done using .to(device_name). Using 'cuda' as the device name will find the first GPU the system has detected.

In [ ]:
# move the input and model to GPU for speed if available
device = 'cuda' if torch.cuda.is_available() else 'cpu'
input_tensor = input_tensor.to(device) # tensor .to() is out of place - must reassign with =
model.to(device) # module .to() moves the model's parameters in place
output = model(input_tensor)
output

The following cell will confirm that both the input tensor and the model are on the same GPU if you're in a GPU runtime environment. Otherwise, both will be on the CPU.

In [ ]:
print(next(model.parameters()).device)
input_tensor.device

Training vs inference practices¶

By default, your model is in training mode. You can ensure training mode with:

In [ ]:
deep_model.train()

If you are done training and ready to:

  • evaluate on a dev set
  • evaluate on a test set
  • run inference on some data without updating your model's weights
  • deploy a model for some purpose

You should do two things:

  1. Set eval mode (turns off dropout and switches batch normalization and any similar layers to their inference behavior):
In [ ]:
deep_model.eval()
  2. Use torch.no_grad() as a context manager to avoid computing gradients. Gradient tracking adds significantly to the time and memory needed to process an input, and it is unnecessary unless we wish to update the model's parameters.
In [ ]:
with torch.no_grad():
    output = deep_model(input_tensor)
output

Be sure to always switch back to training mode before you continue to train!
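
Putting the pieces together, a typical evaluation step looks something like this (a sketch reusing the batched tensor from earlier):

In [ ]:
deep_model.eval()                                  # 1. switch to eval mode
with torch.no_grad():                              # 2. turn off gradient tracking
    dev_output = deep_model(batched_input_tensor)
deep_model.train()                                 # back to training mode before any further training
dev_output.argmax(dim=1)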

More practice (if time)¶

Take a look at this dataset of hand-written digits.

Try to define a model architecture suited to these inputs and outputs.

In [19]:
from sklearn.datasets import load_digits
In [ ]:
# YOUR CODE HERE

Bonus¶

In [20]:
from sklearn.datasets import load_iris

data = load_iris()
data['data'].shape, data['target'].shape
Out[20]:
((150, 4), (150,))
In [21]:
X = torch.tensor(data['data'])
y = torch.tensor(data['target'])

# hold out rows 50-55
X_test = X[50:55]
y_test = y[50:55]

X_train = torch.cat((X[:50], X[55:]))
y_train = torch.cat((y[:50], y[55:]))
In [22]:
crit = nn.CrossEntropyLoss()
opt = torch.optim.SGD(deep_model.parameters(), lr=0.1)
In [24]:
for i in range(1000):
    opt.zero_grad()
    loss = crit(deep_model(X_train.float()), y_train.long())
    loss.backward()
    opt.step()
In [25]:
deep_model(X_test.float()).argmax(dim=1).tolist(), y_test.tolist()
Out[25]:
([1, 1, 1, 1, 1], [1, 1, 1, 1, 1])
In [26]:
torch.save(deep_model.state_dict(), 'iris_model.pt')