%matplotlib inline  # Enable inline plotting in notebook
%config InlineBackend.figure_format = 'retina'

import matplotlib.pyplot as plt  # Import matplotlib for visualization

import torch  # Import PyTorch library
from torch import nn  # Import neural network module
from torch import optim
import torch.nn.functional as F  # Import functional API (F.relu, etc.)
from torchvision import datasets, transforms  # Import datasets and image transforms

import helper  # Import helper visualization functions
import fc_model  # Import pre-built fully connected model

# Preprocessing applied to every image: convert it to a tensor, then
# normalize with mean 0.5 and standard deviation 0.5.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5,), std=(0.5,)),
])

# Training split of Fashion-MNIST (downloaded if it is not already on disk),
# served in shuffled batches of 64.
trainset = datasets.FashionMNIST(
    root='~/.pytorch/F_MNIST_data/',
    train=True,
    download=True,
    transform=transform,
)
trainloader = torch.utils.data.DataLoader(
    dataset=trainset,
    batch_size=64,
    shuffle=True,
)

# Test split, loaded from the same directory with the same preprocessing and
# batching.
testset = datasets.FashionMNIST(
    root='~/.pytorch/F_MNIST_data/',
    train=False,
    download=True,
    transform=transform,
)
testloader = torch.utils.data.DataLoader(
    dataset=testset,
    batch_size=64,
    shuffle=True,
)

# Pull a single batch from the training loader and show its first image.
# The trailing semicolon keeps the notebook from echoing the return value.
image, label = next(iter(trainloader))
helper.imshow(image[0, :]);

# Build the classifier: 784 inputs, 10 outputs, and three hidden layers of
# 512, 256 and 128 units.
model = fc_model.Network(784, 10, [512, 256, 128])

# Negative log-likelihood loss.
# NOTE(review): this presumes fc_model.Network outputs log-probabilities --
# confirm against fc_model.
criterion = nn.NLLLoss()

# Adam over all of the network's parameters with a learning rate of 0.001.
optimizer = optim.Adam(params=model.parameters(), lr=1e-3)

# Run two epochs of training; the test loader is handed to the training
# helper alongside the training loader.
fc_model.train(model, trainloader, testloader, criterion, optimizer, epochs=2)

# Show the architecture and the names of the entries in its state dict.
print("Our model: \n\n", model, '\n')
print("The state dict keys: \n\n", model.state_dict().keys())

# Write only the network's state dict (not the network object) to disk.
torch.save(obj=model.state_dict(), f='checkpoint.pth')

# Read it back. weights_only=True asks torch.load to use its restricted
# unpickler instead of executing arbitrary pickled objects.
state_dict = torch.load(f='checkpoint.pth', weights_only=True)
print(state_dict.keys())

# Copy the restored entries into the existing network.
model.load_state_dict(state_dict)

# Try this: build a network whose hidden layers differ from the saved one.
# It gets its own name so that `model` keeps pointing at the trained network;
# rebinding `model` here would make the checkpoint written afterwards contain
# the random weights of this throwaway network.
mismatched_model = fc_model.Network(784, 10, [400, 200, 100])

# Loading the saved weights fails because the tensor sizes are wrong. The
# expected error is caught and printed so the mismatch is still shown while
# the rest of the notebook/script keeps running.
try:
    mismatched_model.load_state_dict(state_dict)
except RuntimeError as err:
    print(err)

# Bundle what is needed to rebuild the network later. First the architecture:
# input/output sizes plus the width (out_features) of each hidden layer.
checkpoint = {
    'input_size': 784,
    'output_size': 10,
    'hidden_layers': [layer.out_features for layer in model.hidden_layers],
}
# Then the network's state dict.
checkpoint['state_dict'] = model.state_dict()

# Overwrite the earlier file with the self-describing checkpoint.
torch.save(obj=checkpoint, f='checkpoint.pth')

def load_checkpoint(filepath):
    """Rebuild a network from a checkpoint file and restore its weights.

    Args:
        filepath: Location of a checkpoint readable by ``torch.load``. The
            stored object must provide the keys ``'input_size'``,
            ``'output_size'``, ``'hidden_layers'`` and ``'state_dict'``.

    Returns:
        An ``fc_model.Network`` built from the stored sizes, with the stored
        state dict loaded into it.
    """
    saved = torch.load(filepath, weights_only=True)

    # Recreate the architecture first so the parameter shapes line up with
    # the saved state dict, then copy the saved values in.
    architecture = (
        saved['input_size'],
        saved['output_size'],
        saved['hidden_layers'],
    )
    network = fc_model.Network(*architecture)
    network.load_state_dict(saved['state_dict'])
    return network

# Rebuild the network from the checkpoint file and print its architecture.
model = load_checkpoint(filepath='checkpoint.pth')
print(model)

# Saving and Loading Models

## Train a network

## Saving and loading networks