WUT_Computer_Science/lab5/code/main.py

92 lines
2.7 KiB
Python
Raw Normal View History

2023-05-13 12:45:54 +02:00
import torch
import torch.nn as nn
import torch.optim as optim
2023-05-13 13:47:48 +02:00
from torchvision import datasets, transforms
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Set random seed for reproducibility
torch.manual_seed(42)
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Define hyperparameters
learning_rate = 0.001
batch_size = 64
num_epochs = 10
input_size = 28 * 28 # MNIST images are 28x28 pixels
hidden_size = 128
num_classes = 10
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Load MNIST dataset and apply transformations
train_dataset = datasets.MNIST(
root='./data', train=True, transform=transforms.ToTensor(), download=True
)
test_dataset = datasets.MNIST(
root='./data', train=False, transform=transforms.ToTensor(), download=True
)
2023-05-13 13:26:38 +02:00
2023-05-13 13:47:48 +02:00
# Create data loaders
train_loader = torch.utils.data.DataLoader(
dataset=train_dataset, batch_size=batch_size, shuffle=True
)
test_loader = torch.utils.data.DataLoader(
dataset=test_dataset, batch_size=batch_size, shuffle=False
)
2023-05-13 13:26:38 +02:00
2023-05-13 13:47:48 +02:00
# Define the multilayer perceptron model
model = nn.Sequential(
nn.Linear(input_size, hidden_size),
nn.ReLU(),
nn.Linear(hidden_size, num_classes)
)
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Loss function
criterion = nn.CrossEntropyLoss()
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Optimizer
optimizer = optim.Adam(model.parameters(), lr=learning_rate)
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Training loop
for epoch in range(num_epochs):
for batch_idx, (data, targets) in enumerate(train_loader):
# Reshape the input data
data = data.view(data.size(0), -1)
# Forward pass
outputs = model(data)
loss = criterion(outputs, targets)
# Backward pass and optimization
2023-05-13 12:45:54 +02:00
optimizer.zero_grad()
loss.backward()
optimizer.step()
2023-05-13 13:47:48 +02:00
# Print loss value for every learning step
if (batch_idx+1) % 100 == 0:
print(f'Epoch [{epoch+1}/{num_epochs}], Step [{batch_idx+1}/{len(train_loader)}], Loss: {loss.item():.4f}')
# Calculate accuracy on train set after each epoch
correct = 0
total = 0
for data, targets in train_loader:
data = data.view(data.size(0), -1)
outputs = model(data)
_, predicted = torch.max(outputs.data, 1)
total += targets.size(0)
correct += (predicted == targets).sum().item()
train_accuracy = 100 * correct / total
print(f'Accuracy on Train Set after Epoch {epoch+1}: {train_accuracy:.2f}%')
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Calculate accuracy on validation set after each epoch
correct = 0
total = 0
for data, targets in test_loader:
data = data.view(data.size(0), -1)
outputs = model(data)
_, predicted = torch.max(outputs.data, 1)
total += targets.size(0)
correct += (predicted == targets).sum().item()
validation_accuracy = 100 * correct / total
print(f'Accuracy on Validation Set after Epoch {epoch+1}: {validation_accuracy:.2f}%')
print('---')
2023-05-13 12:45:54 +02:00
2023-05-13 13:47:48 +02:00
# Conclusions and observations can be included in the report