import torch
import torch.optim as optim
import torch.nn.functional as F
import torchvision
import torchvision.datasets as datasets
import torchvision.models as models
import torchvision.transforms as transforms

!unzip -qf dataset.zip

# Preprocessing applied to every image when it is read from disk, in order:
#   1. small random perturbation of brightness, contrast, saturation and hue
#   2. resize to 224x224
#   3. conversion to a tensor
#   4. per-channel normalization with the mean/std constants below
#      (presumably the statistics the pretrained backbone expects - confirm)
# The transform is attached to the dataset itself, so any subset derived
# from it goes through the same random jitter.
preprocess = transforms.Compose([
    transforms.ColorJitter(brightness=0.1, contrast=0.1, saturation=0.1, hue=0.1),
    transforms.Resize((224, 224)),
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
])

# ImageFolder derives the class labels from the sub-directories of 'dataset'.
dataset = datasets.ImageFolder(root='dataset', transform=preprocess)

# Hold out a fixed number of randomly chosen samples for evaluation and
# train on everything else. The split is drawn afresh on every run.
num_test_samples = 50
num_train_samples = len(dataset) - num_test_samples
train_dataset, test_dataset = torch.utils.data.random_split(
    dataset,
    [num_train_samples, num_test_samples],
)

# Both loaders use the same batching configuration: batches of 8 samples,
# reshuffled on every pass, loaded in the main process (num_workers=0).
loader_options = dict(batch_size=8, shuffle=True, num_workers=0)

train_loader = torch.utils.data.DataLoader(train_dataset, **loader_options)
test_loader = torch.utils.data.DataLoader(test_dataset, **loader_options)

# Start from torchvision's ResNet-18 with its default pretrained weights.
model = models.resnet18(weights='DEFAULT')

# Swap the final fully connected layer for a fresh 2-output head
# (presumably one output per class folder in the dataset - confirm).
# The input width is read from the layer being replaced instead of being
# hard-coded, so the line keeps working if the backbone is changed.
model.fc = torch.nn.Linear(model.fc.in_features, 2)

# Use the GPU when one is available; otherwise fall back to the CPU so the
# notebook still runs (slowly) on machines without CUDA.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
model = model.to(device)

# Training configuration.
NUM_EPOCHS = 30
BEST_MODEL_PATH = 'best_model_resnet18.pth'  # checkpoint of the best epoch so far
best_accuracy = 0.0

optimizer = optim.SGD(model.parameters(), lr=0.001, momentum=0.9)

# Each epoch: one full pass over the training set, then one evaluation pass
# over the held-out set. The weights are saved whenever the held-out
# accuracy improves on the best value seen so far.
for epoch in range(NUM_EPOCHS):

    # Training mode: layers such as batch normalization use per-batch
    # statistics and update their running estimates.
    model.train()
    for images, labels in train_loader:
        images = images.to(device)
        labels = labels.to(device)
        optimizer.zero_grad()
        outputs = model(images)
        loss = F.cross_entropy(outputs, labels)
        loss.backward()
        optimizer.step()

    # Evaluation mode: mode-dependent layers switch to inference behavior,
    # so the score does not depend on how the held-out samples are batched
    # and the evaluation pass does not alter the model's running statistics.
    model.eval()
    test_error_count = 0
    # No gradients are needed for scoring; disabling autograd saves memory
    # and time.
    with torch.no_grad():
        for images, labels in test_loader:
            images = images.to(device)
            labels = labels.to(device)
            predictions = model(images).argmax(1)
            # Count misclassified samples. Comparing with != stays correct
            # for any number of classes, unlike summing |label - prediction|.
            test_error_count += int((predictions != labels).sum())

    test_accuracy = 1.0 - test_error_count / len(test_dataset)
    print('%d: %f' % (epoch, test_accuracy))
    if test_accuracy > best_accuracy:
        torch.save(model.state_dict(), BEST_MODEL_PATH)
        best_accuracy = test_accuracy

/usr/local/lib/python3.10/dist-packages/torchvision/transforms/_functional_pil.py:113: RuntimeWarning: invalid value encountered in cast
  np_h += np.array(hue_factor * 255).astype(np.uint8)

0: 0.940000
1: 0.840000
2: 0.920000
3: 0.960000
4: 0.920000
5: 0.900000
6: 0.900000
7: 0.900000
8: 0.980000
9: 0.980000
10: 0.860000
11: 0.960000
12: 0.980000
13: 0.980000
14: 1.000000
15: 1.000000
16: 1.000000
17: 0.980000
18: 0.960000
19: 0.940000
20: 0.960000
21: 0.880000
22: 0.940000
23: 0.960000
24: 0.960000
25: 0.940000
26: 0.980000
27: 0.960000
28: 0.980000
29: 0.920000

Collision Avoidance - Train Model (ResNet18)

Upload and extract dataset

Create dataset instance

Split dataset into train and test sets

Create data loaders to load data in batches

Define the neural network

Train the neural network