https://github.com/elaheghiyabi96/fashion_mnist_nn_torch
"Simple neural network model using Torch for classifying the Fashion MNIST dataset, implemented with Torch."
- Host: GitHub
- URL: https://github.com/elaheghiyabi96/fashion_mnist_nn_torch
- Owner: elaheghiyabi96
- Created: 2025-05-05T16:31:11.000Z (about 1 month ago)
- Default Branch: main
- Last Pushed: 2025-05-05T16:37:16.000Z (about 1 month ago)
- Last Synced: 2025-05-05T17:56:59.774Z (about 1 month ago)
- Topics: adam-optimizer, cross-entropy-loss, deep-learning, dropout, fashion-mnist, feedforward-neural-network, image-classification, machine-learning, model-evaluation, model-training, neural-network, pytorch, relu-activation, test-accuracy, training-loss
- Language: Jupyter Notebook
- Homepage:
- Size: 44.9 KB
- Stars: 0
- Watchers: 1
- Forks: 0
- Open Issues: 0
Metadata Files:
- Readme: README.md
README
# fashion_mnist_nn_torch
"Simple neural network model using Torch for classifying the Fashion MNIST dataset, implemented with Torch."
In this code, we implement a simple feedforward neural network in PyTorch to classify the Fashion MNIST dataset.
The dataset consists of 28x28-pixel grayscale images of clothing items across 10 classes.
Each image is flattened into a 784-dimensional vector and passed through three hidden fully connected layers of 128, 256, and 64 neurons, each followed by a ReLU activation and a dropout layer (p=0.3) for regularization.
A final output layer maps the 64 hidden features to the 10 classes.
The network is trained for 15 epochs with the Adam optimizer (learning rate 0.001, weight decay 1e-5) and cross-entropy loss, and its loss on the test set is tracked after each epoch.
After training, the model achieved an accuracy of 87.67% on the test set.
```python
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader
import matplotlib.pyplot as plt

# Select device: use GPU if available, otherwise fall back to CPU
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Data preprocessing: convert images to tensors
transform = transforms.Compose([transforms.ToTensor()])

# Load the FashionMNIST dataset for training and testing
train_data = datasets.FashionMNIST(root='./data', train=True, download=True, transform=transform)
test_data = datasets.FashionMNIST(root='./data', train=False, download=True, transform=transform)

# Create data loaders for batching and shuffling
train_loader = DataLoader(train_data, batch_size=32, shuffle=True)
test_loader = DataLoader(test_data, batch_size=32, shuffle=False)
```
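The notebook preprocesses with `ToTensor()` only. As an aside not present in the original repo, a common variant also normalizes the inputs; the sketch below computes the statistics from the training set rather than hard-coding them (`transform_norm` is a hypothetical name, and to take effect it would have to be passed when constructing the datasets):

```python
# Sketch of an optional preprocessing variant (not in the original code):
# compute the training-set mean/std once, then normalize inputs with them.
imgs = torch.stack([img for img, _ in train_data])  # shape: (60000, 1, 28, 28)
mean, std = imgs.mean().item(), imgs.std().item()
transform_norm = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((mean,), (std,)),  # zero-center and rescale each pixel
])
```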
```python
# Define a feedforward neural network with 3 hidden layers and dropout
class SimpleNN(nn.Module):
    def __init__(self):
        super(SimpleNN, self).__init__()
        self.fc1 = nn.Linear(28 * 28, 128)  # First hidden layer (input: 784 → output: 128)
        self.relu1 = nn.ReLU()
        self.dropout1 = nn.Dropout(0.3)
        self.fc2 = nn.Linear(128, 256)      # Second hidden layer (128 → 256)
        self.relu2 = nn.ReLU()
        self.dropout2 = nn.Dropout(0.3)
        self.fc3 = nn.Linear(256, 64)       # Third hidden layer (256 → 64)
        self.relu3 = nn.ReLU()
        self.dropout3 = nn.Dropout(0.3)
        self.fc4 = nn.Linear(64, 10)        # Output layer (64 → 10 classes)

    def forward(self, x):
        x = x.view(-1, 28 * 28)  # Flatten input image from 1x28x28 to 784
        x = self.fc1(x)
        x = self.relu1(x)
        x = self.dropout1(x)
        x = self.fc2(x)
        x = self.relu2(x)
        x = self.dropout2(x)
        x = self.fc3(x)
        x = self.relu3(x)
        x = self.dropout3(x)
        x = self.fc4(x)
        return x
```
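For reference, and not part of the original repo, the same architecture can be written more compactly with `nn.Sequential`; `model_seq` below is a hypothetical name, and the parameter count follows from the layer sizes above:

```python
# Equivalent compact form of SimpleNN (sketch, not in the original notebook).
model_seq = nn.Sequential(
    nn.Flatten(),                          # 1x28x28 → 784
    nn.Linear(28 * 28, 128), nn.ReLU(), nn.Dropout(0.3),
    nn.Linear(128, 256), nn.ReLU(), nn.Dropout(0.3),
    nn.Linear(256, 64), nn.ReLU(), nn.Dropout(0.3),
    nn.Linear(64, 10),                     # Raw logits; CrossEntropyLoss applies softmax internally
)

# Trainable parameters implied by these sizes (weights + biases):
# 784*128+128 + 128*256+256 + 256*64+64 + 64*10+10 = 150,602
print(sum(p.numel() for p in model_seq.parameters()))  # 150602
```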
```python
# Initialize model, loss function, and optimizer
model = SimpleNN().to(device)
criterion = nn.CrossEntropyLoss()  # Suitable for multi-class classification
optimizer = optim.Adam(model.parameters(), lr=0.001, weight_decay=1e-5)

# Lists to store loss values for plotting
train_losses = []
test_losses = []

# Training loop for 15 epochs
for epoch in range(15):
    model.train()  # Set model to training mode (enables dropout)
    total_loss = 0
    for images, labels in train_loader:
        images, labels = images.to(device), labels.to(device)
        optimizer.zero_grad()              # Clear previous gradients
        outputs = model(images)            # Forward pass
        loss = criterion(outputs, labels)  # Compute loss
        loss.backward()                    # Backward pass
        optimizer.step()                   # Update model weights
        total_loss += loss.item()
    avg_train_loss = total_loss / len(train_loader)
    train_losses.append(avg_train_loss)

    # Evaluate model on the test set
    model.eval()  # Evaluation mode (disables dropout)
    test_loss = 0
    with torch.no_grad():  # No need to compute gradients
        for images, labels in test_loader:
            images, labels = images.to(device), labels.to(device)
            outputs = model(images)
            loss = criterion(outputs, labels)
            test_loss += loss.item()
    avg_test_loss = test_loss / len(test_loader)
    test_losses.append(avg_test_loss)

    print(f"Epoch {epoch+1}/15, Train Loss: {avg_train_loss:.4f}, Test Loss: {avg_test_loss:.4f}")
```
```python
# Final evaluation on the test dataset
model.eval()
correct = 0
total = 0
with torch.no_grad():
    for images, labels in test_loader:
        images, labels = images.to(device), labels.to(device)
        outputs = model(images)
        _, predicted = torch.max(outputs, 1)  # Choose the class with the highest logit
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
accuracy = 100 * correct / total
print(f"Test Accuracy: {accuracy:.2f}%")
```
```python
# Plot training and test loss curves
plt.plot(train_losses, label='Train Loss')
plt.plot(test_losses, label='Test Loss')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.legend()
plt.title('Train vs Test Loss')
plt.grid(True)
plt.show()
```
```python
# Display a specific test image and its prediction
import numpy as np

# Get image and label at index 100
index = 100
image, label = test_data[index]

# Move model to eval mode and disable gradients
model.eval()
with torch.no_grad():
    input_image = image.unsqueeze(0).to(device)  # Add batch dimension and send to device
    output = model(input_image)
    predicted_class = output.argmax(dim=1).item()

# Class names for FashionMNIST
class_names = ['T-shirt/top', 'Trouser', 'Pullover', 'Dress', 'Coat',
               'Sandal', 'Shirt', 'Sneaker', 'Bag', 'Ankle boot']

# Print actual and predicted classes
print("True label:", class_names[label])
print("Predicted label:", class_names[predicted_class])

# Plot the image
plt.imshow(np.squeeze(image), cmap='gray')
plt.title(f"True: {class_names[label]}, Predicted: {class_names[predicted_class]}")
plt.axis('off')
plt.show()
```
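The notebook ends here. As a follow-up sketch that is not part of the original repo (the filename is an assumption), the trained weights could be persisted and reloaded with standard PyTorch calls:

```python
# Sketch (not in the original notebook): save and reload the trained weights.
torch.save(model.state_dict(), "fashion_mnist_nn.pt")  # hypothetical filename

# Later, rebuild the architecture and load the saved weights for inference.
restored = SimpleNN().to(device)
restored.load_state_dict(torch.load("fashion_mnist_nn.pt", map_location=device))
restored.eval()  # disable dropout for inference
```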