Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Refactor training loop from script to class #65

Closed
wants to merge 3 commits into from
Closed
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
56 changes: 55 additions & 1 deletion README.md
Original file line number Diff line number Diff line change
@@ -1 +1,55 @@
# evals
# evals

This project now includes a new class `MNISTTrainer` which is used to train a model on the MNIST dataset.

## MNISTTrainer

The `MNISTTrainer` class is defined in `src/main.py`. It includes methods for loading and preprocessing the MNIST dataset, defining the model architecture, and training the model.

### Usage

An instance of `MNISTTrainer` is created and then its methods are used to load the data, define the model, and train the model. Here is an example:

```python
# Create an instance of MNISTTrainer
trainer = MNISTTrainer()

# Load the data
trainloader = trainer.load_data()

# Define the model
Net = trainer.define_model()
model = Net(trainloader)

# Train the model
optimizer = optim.SGD(model.parameters(), lr=0.01)
criterion = nn.NLLLoss()

# Training loop
epochs = 3
for epoch in range(epochs):
for images, labels in model.trainloader:
optimizer.zero_grad()
output = model(images)
loss = criterion(output, labels)
loss.backward()
optimizer.step()
```

The trained model is then saved and can be loaded in `src/api.py` using the `MNISTTrainer` class in a similar way:

```python
# Create an instance of MNISTTrainer
trainer = MNISTTrainer()

# Load the data
trainloader = trainer.load_data()

# Define the model
Net = trainer.define_model()
model = Net(trainloader)

# Load the model's state from the saved file
model.load_state_dict(torch.load("mnist_model.pth"))
model.eval()
```
15 changes: 12 additions & 3 deletions src/api.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,10 +2,19 @@
from PIL import Image
import torch
from torchvision import transforms
from main import Net # Importing Net class from main.py
from main import MNISTTrainer # Importing MNISTTrainer class from main.py

# Load the model
model = Net()
# Create an instance of MNISTTrainer
trainer = MNISTTrainer()

# Load the data
trainloader = trainer.load_data()

# Define the model
Net = trainer.define_model()
model = Net(trainloader)

# Load the model's state from the saved file
model.load_state_dict(torch.load("mnist_model.pth"))
model.eval()

Expand Down
65 changes: 40 additions & 25 deletions src/main.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,39 +6,54 @@
from torch.utils.data import DataLoader
import numpy as np

# Step 1: Load MNIST Data and Preprocess
transform = transforms.Compose([
transforms.ToTensor(),
transforms.Normalize((0.5,), (0.5,))
])
class MNISTTrainer:
def __init__(self):
self.transform = transforms.Compose([
transforms.ToTensor(),
transforms.Normalize((0.5,), (0.5,))
])

trainset = datasets.MNIST('.', download=True, train=True, transform=transform)
trainloader = DataLoader(trainset, batch_size=64, shuffle=True)
def load_data(self):
trainset = datasets.MNIST('.', download=True, train=True, transform=self.transform)
trainloader = DataLoader(trainset, batch_size=64, shuffle=True)
return trainloader

# Step 2: Define the PyTorch Model
class Net(nn.Module):
def __init__(self):
super().__init__()
self.fc1 = nn.Linear(28 * 28, 128)
self.fc2 = nn.Linear(128, 64)
self.fc3 = nn.Linear(64, 10)

def forward(self, x):
x = x.view(-1, 28 * 28)
x = nn.functional.relu(self.fc1(x))
x = nn.functional.relu(self.fc2(x))
x = self.fc3(x)
return nn.functional.log_softmax(x, dim=1)

# Step 3: Train the Model
model = Net()
def define_model(self):
class Net(nn.Module):
def __init__(self, trainloader):
super().__init__()
self.trainloader = trainloader
self.fc1 = nn.Linear(28 * 28, 128)
self.fc2 = nn.Linear(128, 64)
self.fc3 = nn.Linear(64, 10)

def forward(self, x):
x = x.view(-1, 28 * 28)
x = nn.functional.relu(self.fc1(x))
x = nn.functional.relu(self.fc2(x))
x = self.fc3(x)
return nn.functional.log_softmax(x, dim=1)

return Net

# Create an instance of MNISTTrainer
trainer = MNISTTrainer()

# Load the data
trainloader = trainer.load_data()

# Define the model
Net = trainer.define_model()
model = Net(trainloader)

# Train the model
optimizer = optim.SGD(model.parameters(), lr=0.01)
criterion = nn.NLLLoss()

# Training loop
epochs = 3
for epoch in range(epochs):
for images, labels in trainloader:
for images, labels in model.trainloader:
optimizer.zero_grad()
output = model(images)
loss = criterion(output, labels)
Expand Down
Loading