import os
import numpy as np
import matplotlib.pyplot as plt

# Detect Google Colab: the import below raises ImportError anywhere else,
# which routes execution to the local-setup branch.
try:
    import google.colab
    REPO_URL = "https://github.com/wtheisen/nd-cse-30124-homeworks.git"
    REPO_NAME = "nd-cse-30124-homeworks"
    LAB_FOLDER = "evidence/lab03"

    # NOTE: the `%cd` and `!git` lines are IPython magics; they only work when
    # this code runs as a notebook cell, not as a plain Python script.
    %cd /content/
    # Clone the course repository only if it is not already present.
    if not os.path.exists(REPO_NAME):
        !git clone {REPO_URL}

    # Switch into the lab folder; presumably so the relative data paths used
    # later in the notebook resolve - confirm against the repo layout.
    %cd {REPO_NAME}/{LAB_FOLDER}

except ImportError:
    print("Not running on Colab - assuming local setup.")

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data import TensorDataset, DataLoader

# Report library versions so results can be tied to a specific environment.
print(f"PyTorch version: {torch.__version__}")
print(f"NumPy version:   {np.__version__}")

# Pick the compute backend in priority order: CUDA, then MPS, then CPU.
if torch.cuda.is_available():
    device = torch.device('cuda')
elif torch.backends.mps.is_available():
    device = torch.device('mps')
else:
    device = torch.device('cpu')
print(f"Using device:    {device}")
print("Setup complete!")

/content
Cloning into 'nd-cse-30124-homeworks'...
remote: Enumerating objects: 721, done.
remote: Counting objects: 100% (137/137), done.
remote: Compressing objects: 100% (33/33), done.
remote: Total 721 (delta 127), reused 104 (delta 104), pack-reused 584 (from 1)
Receiving objects: 100% (721/721), 229.02 MiB | 29.01 MiB/s, done.
Resolving deltas: 100% (269/269), done.
Updating files: 100% (315/315), done.
/content/nd-cse-30124-homeworks/evidence/lab03
PyTorch version: 2.10.0+cpu
NumPy version:   2.0.2
Using device:    cpu
Setup complete!

# Load the EMNIST training data from the .npz file
# (the path is relative, so the working directory must be the lab folder).
data = np.load("emnist_balanced_small/emnist_balanced_small_train.npz")
images_np = data['X']       # shape: (n_samples, 28, 28), dtype: uint8
labels_np = data['y']       # shape: (n_samples,), dtype: int64

print(f"NumPy images: shape={images_np.shape}, dtype={images_np.dtype}")
print(f"NumPy labels: shape={labels_np.shape}, dtype={labels_np.dtype}")

# NOTE: the two placeholders below are intentionally None; the prints that
# follow raise AttributeError until both are replaced with real tensors.

# TODO: Flatten images to (n_samples, 784), normalize to [0, 1], convert to float32 tensor
# (784 = 28 * 28; uint8 pixels span 0-255, so scale by 255 after converting to float)
images_tensor = None

# TODO: Convert labels to long tensor (required by CrossEntropyLoss)
labels_tensor = None

# Sanity checks: shapes, dtypes and the normalized pixel range.
print(f"\nTensor images: shape={images_tensor.shape}, dtype={images_tensor.dtype}")
print(f"Tensor labels: shape={labels_tensor.shape}, dtype={labels_tensor.dtype}")
print(f"Pixel value range: [{images_tensor.min():.1f}, {images_tensor.max():.1f}]")

# Verify first few labels
print(f"\nFirst 10 labels: {labels_tensor[:10]}")

NumPy images: shape=(9400, 28, 28), dtype=uint8
NumPy labels: shape=(9400,), dtype=int64

Tensor images: shape=torch.Size([9400, 784]), dtype=torch.float32
Tensor labels: shape=torch.Size([9400]), dtype=torch.int64
Pixel value range: [0.0, 1.0]

First 10 labels: tensor([45, 45, 45, 45, 45, 45, 45, 45, 45, 45])

class SimpleClassifier(nn.Module):
    """Single-layer classifier: one Linear layer from 784 inputs to 47 outputs.

    Scaffold: ``forward`` is left for the student to implement.
    """

    def __init__(self):
        super().__init__()
        # 784 matches a flattened 28x28 image; 47 is presumably the number of
        # classes in the dataset - confirm against the label range.
        self.fc = nn.Linear(784, 47)

    # TODO: Finish the forward pass of the simple classifier
    def forward(self, x):
        # Placeholder: returns None until implemented, so calling the model
        # yields no logits yet.
        pass

# NOTE: `model` and `output` are intentional None placeholders; this cell
# raises AttributeError until both TODOs are completed.

# TODO: Create an instance of your neural network
model = None

# Printing an nn.Module lists its registered sub-layers.
print(model)

# Count every scalar parameter (weights and biases) in the model.
total_params = sum(p.numel() for p in model.parameters())
print(f"\nTotal parameters: {total_params:,}")

test_batch = images_tensor[:4]           # (4, 784)

# TODO: Test forward pass on first 4 samples
output = None

print(f"\nInput shape:  {test_batch.shape}")
print(f"Output shape: {output.shape}")

# Get predicted classes (these are random since the model is untrained)
predictions = torch.argmax(output, dim=1)
print(f"Predicted classes: {predictions}")
# Plain string: there is nothing to interpolate, so no f-prefix is needed.
print("(These are random - the model hasn't been trained yet!)")

SimpleClassifier(
  (fc): Linear(in_features=784, out_features=47, bias=True)
)

Total parameters: 36,895

Input shape:  torch.Size([4, 784])
Output shape: torch.Size([4, 47])
Predicted classes: tensor([ 1, 24,  1, 26])
(These are random - the model hasn't been trained yet!)

from torch.utils.data import random_split

# NOTE: the None/pass placeholders below are intentional; the cell raises
# until every TODO is completed.

# TODO: Create TensorDataset from images and labels
full_dataset = None

print(f"Full dataset size: {len(full_dataset)}")

# TODO: Split into train (80%) and val (20%)
# Define the integer sizes `n_train` and `n_val` here; they are consumed by
# random_split below and must add up to len(full_dataset).
pass

train_dataset, val_dataset = random_split(full_dataset, [n_train, n_val])
print(f"Train: {len(train_dataset)}, Val: {len(val_dataset)}")

# TODO: Create DataLoaders with batch_size=64
train_loader = None
val_loader = None

# Print one batch to verify shapes
# (only the first batch is inspected; `break` leaves the loop immediately)
for batch_x, batch_y in train_loader:
    print(f"\nTraining batch: x={batch_x.shape}, y={batch_y.shape}")
    break

for batch_x, batch_y in val_loader:
    print(f"Validation batch: x={batch_x.shape}, y={batch_y.shape}")
    break

Full dataset size: 9400
Train: 7520, Val: 1880

Training batch: x=torch.Size([64, 784]), y=torch.Size([64])
Validation batch: x=torch.Size([64, 784]), y=torch.Size([64])

# Fresh single-layer model for training (separate from any earlier instance).
simple_model = SimpleClassifier()

# TODO: Create optimizer and loss function
# (intentional None placeholders; the loop below raises until they are set)
optimizer = None
criterion = None

for epoch in range(5):
    simple_model.train()    # put the module in training mode
    total_loss = 0          # running sum of per-batch losses for this epoch

    for batch_x, batch_y in train_loader:
        # TODO: For each batch: Forward pass, calculate loss, reset gradients, backprop, gradient descent
        logits = None       # forward pass
        loss = None    # compute loss

        optimizer.zero_grad()                # reset gradients

        pass                      # compute gradients
        pass                     # update weights

        # .item() extracts the scalar loss as a plain Python number.
        total_loss += loss.item()

    # Average over the number of batches, not the number of samples.
    avg_loss = total_loss / len(train_loader)
    print(f"Epoch {epoch+1}/5: avg loss = {avg_loss:.4f}")

# Score the single-layer model on the validation loader.
simple_model.eval()
correct, total = 0, 0

# Autograd tracking is switched off while scoring.
with torch.no_grad():
    for batch_x, batch_y in val_loader:
        logits = simple_model(batch_x)
        # The predicted class is the index of the largest logit in each row.
        predictions = logits.argmax(dim=1)
        correct += predictions.eq(batch_y).sum().item()
        total += batch_y.shape[0]

simple_accuracy = correct / total
print(f"\nSimple model validation accuracy: {simple_accuracy:.4f} ({correct}/{total})")

Epoch 1/5: avg loss = 2.7509
Epoch 2/5: avg loss = 1.8086
Epoch 3/5: avg loss = 1.5426
Epoch 4/5: avg loss = 1.4084
Epoch 5/5: avg loss = 1.3297

Simple model validation accuracy: 0.6223 (1170/1880)

# TODO: Finish the multi-layer FFN
# The expected output for this task prints three Linear layers named
# fc1, fc2 and fc3 with sizes 784 -> 256 -> 128 -> 47.
class DeepClassifier(nn.Module):
    """Multi-layer feed-forward classifier (scaffold: layers not yet defined)."""

    def __init__(self):
        super().__init__()
        # Placeholder: define the layers here.
        pass

    def forward(self, x):
        # Placeholder: returns None until implemented. Presumably a
        # nonlinearity belongs between the layers - confirm with the lab text.
        pass

# NOTE: `deep_model` and `output` are intentional None placeholders; this cell
# raises AttributeError until both TODOs are completed.

# TODO: Create an instance and print architecture
deep_model = None

# Count every scalar parameter (weights and biases) in the deep model.
total_params = sum(p.numel() for p in deep_model.parameters())
print(f"\nTotal parameters: {total_params:,}")

test_batch = images_tensor[:4]

# TODO: Test forward pass
# Explicitly reset `output` so a stale value left over from the single-layer
# forward-pass check cannot be printed below as if the deep model produced it.
output = None

print(f"\nInput shape:  {test_batch.shape}")
print(f"Output shape: {output.shape}")

DeepClassifier(
  (fc1): Linear(in_features=784, out_features=256, bias=True)
  (fc2): Linear(in_features=256, out_features=128, bias=True)
  (fc3): Linear(in_features=128, out_features=47, bias=True)
)

Total parameters: 239,919

Input shape:  torch.Size([4, 784])
Output shape: torch.Size([4, 47])

# TODO: Train the deep model (same pattern as Task 04)
# Placeholder for setup: the evaluation code that follows expects a trained
# model bound to the name `deep_model`.
pass

# Placeholder training loop: 5 epochs. The expected output shows one
# "Epoch i/5: avg loss = ..." line per epoch.
for epoch in range(5):
    pass

# Score the deep model on the validation loader.
deep_model.eval()
correct, total = 0, 0

# Autograd tracking is switched off while scoring.
with torch.no_grad():
    for batch_x, batch_y in val_loader:
        logits = deep_model(batch_x)
        # The predicted class is the index of the largest logit in each row.
        predictions = logits.argmax(dim=1)
        correct += predictions.eq(batch_y).sum().item()
        total += batch_y.shape[0]

deep_accuracy = correct / total
print(f"\nDeep model validation accuracy: {deep_accuracy:.4f} ({correct}/{total})")

# Side-by-side summary; the improvement is reported in percentage points.
print(f"\n{'='*50}")
print(f"Simple model (1 layer):  {simple_accuracy:.4f}")
print(f"Deep model   (3 layers): {deep_accuracy:.4f}")
print(f"Improvement: {(deep_accuracy - simple_accuracy)*100:+.1f} percentage points")

Epoch 1/5: avg loss = 2.6217
Epoch 2/5: avg loss = 1.4934
Epoch 3/5: avg loss = 1.2616
Epoch 4/5: avg loss = 1.0890
Epoch 5/5: avg loss = 0.9510

Deep model validation accuracy: 0.6686 (1257/1880)

==================================================
Simple model (1 layer):  0.6223
Deep model   (3 layers): 0.6686
Improvement: +4.6 percentage points

import os, json

ASS_PATH = "nd-cse-30124-homeworks/labs"
ASS = "lab03"

# Export this notebook to HTML.
#   1. On Colab: fetch the live notebook JSON, save it into the cloned repo,
#      convert it with nbconvert and trigger a browser download.
#   2. Otherwise (or if the Colab path fails for any reason): convert the
#      notebook file sitting in the current working directory.
# The warning is printed only when BOTH paths fail. Previously it lived in a
# `finally` clause and was therefore printed even after a successful export.
import subprocess

exported = False
try:
    from google.colab import _message, files

    repo_ipynb_path = f"/content/{ASS_PATH}/{ASS}/{ASS}.ipynb"

    # Ask the Colab frontend for the current notebook contents.
    nb = _message.blocking_request("get_ipynb", timeout_sec=1)["ipynb"]

    os.makedirs(os.path.dirname(repo_ipynb_path), exist_ok=True)
    with open(repo_ipynb_path, "w", encoding="utf-8") as f:
        json.dump(nb, f)

    # check=True turns a failed conversion into an exception, which sends
    # control to the local fallback below.
    subprocess.run(
        ["jupyter", "nbconvert", "--to", "html", repo_ipynb_path],
        check=True,
    )
    files.download(repo_ipynb_path.replace(".ipynb", ".html"))
    exported = True
except Exception:
    # `Exception` rather than a bare `except:` so that KeyboardInterrupt and
    # SystemExit are not swallowed. ImportError (not on Colab) lands here too.
    nb_fp = os.getcwd() + f'/{ASS}.ipynb'
    print(os.getcwd())

    try:
        subprocess.run(["jupyter", "nbconvert", "--to", "html", nb_fp], check=True)
        exported = True
    except (subprocess.CalledProcessError, OSError) as export_error:
        # CalledProcessError: nbconvert ran but failed.
        # OSError: the `jupyter` executable could not be launched.
        print(f'[WARNING]: Local export failed: {export_error}')

if not exported:
    print('[WARNING]: Unable to export notebook as .html')

[NbConvertApp] Converting notebook /content/nd-cse-30124-homeworks/labs/lab03/lab03.ipynb to html
[NbConvertApp] WARNING | Alternative text is missing on 1 image(s).
[NbConvertApp] Writing 355721 bytes to /content/nd-cse-30124-homeworks/labs/lab03/lab03.html

[WARNING]: Unable to export notebook as .html

Task ID	Description	Points
00	Setup	0
01	NumPy ↔ Tensor Conversion	1
02	Define a Single-Layer Classifier	0.5
03	Create a DataLoader	1
04	Train the Single-Layer Model	0.5
05	Build a Multi-Layer FFN	1
06	Train and Compare	1
07	Generate Police Report	0

CSE 30124 - Introduction to Artificial Intelligence: Lab 03 (5 pts.)¶

Story Progression¶

Task 00: Setup (0 pts.)¶

Task 00: Code (0 pts.)¶

Task 01: NumPy ↔ Tensor Conversion (1 pt.)¶

Task 01: Code (1 pt.)¶

Task 01: Expected Output (1 pt.)¶

Story Progression¶

Task 02: Define a Single-Layer Classifier (0.5 pts.)¶

Task 02: Code (0.5 pts.)¶

Task 02: Expected Output (0.5 pts.)¶

Story Progression¶

Task 03: Create a DataLoader (1 pt.)¶

Task 03: Code (1 pt.)¶

Task 03: Expected Output (1 pt.)¶

Story Progression¶

Task 04: Train the Single-Layer Model (0.5 pts.)¶

Task 04: Code (0.5 pts.)¶

Task 04: Expected Output (0.5 pts.)¶

Story Progression¶

Task 05: Build a Multi-Layer FFN (1 pt.)¶

Task 05: Code (1 pt.)¶

Task 05: Expected Output (1 pt.)¶

Story Progression¶

Task 06: Train and Compare (1 pt.)¶

Task 06: Code (1 pt.)¶

Task 06: Expected Output (0.5 pts.)¶

Task 06: Short Answer (0.5 pts.)¶

Story Progression¶

Task 07: Generate Police Report (0 pts.)¶

Task 07: Code (0 pts.)¶