Vehicle Type Recognition with Deep Learning

The document walks through a machine learning project for vehicle type recognition on a four-class dataset (Bus, Car, Truck, motorcycle), training and evaluating five neural network architectures: AlexNet, VGG16, LeNet, ZFNet, and ResNet50. It includes steps for dataset preparation, model training, and evaluation, reporting accuracy, precision, recall, and F1-score for each model. Performance varies widely: AlexNet reaches 22.50% test accuracy, VGG16 26.67% (42.50% on a second run), LeNet 54.17%, ZFNet a best validation accuracy of 66.25%, and ResNet50 79.17%.


Name: Muhammad Hermen Khan

Enrollment: 01-136221-054

BS-AI-6A

Dataset Link: [Link]

!unzip /content/[Link] -d /content/final

from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

from torch.utils.data import DataLoader, random_split
from torchvision import transforms, datasets
from torchvision import models
from torch import nn, optim
import torch

# Step 1: Dataset Preparation

# Dataset path
data_dir = r"/content/final/Dataset"  # Update this to your dataset path

# Define transformations
transform = transforms.Compose([
    transforms.Resize((224, 224)),  # Standard input size for most models
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

# Load complete dataset
dataset = datasets.ImageFolder(data_dir, transform=transform)

# Split dataset into training (70%) and testing (30%)
train_size = int(0.7 * len(dataset))
test_size = len(dataset) - train_size
train_dataset, test_dataset = random_split(dataset, [train_size, test_size])

# Create DataLoaders
batch_size = 32
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

# Number of classes
num_classes = len(dataset.classes)
print(f"Number of classes: {num_classes}")
print(f"Classes: {dataset.classes}")

# Step 2: AlexNet Model

# Initialize the device
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Training and evaluation function reporting accuracy, precision, recall, F1-score
def train_and_evaluate_AlexNet(train_loader, test_loader, num_classes, epochs=5):
    # Load pretrained AlexNet model
    model = models.alexnet(pretrained=True).to(device)

    # Modify the classifier for the number of classes in the dataset
    model.classifier[6] = nn.Linear(model.classifier[6].in_features, num_classes).to(device)

    # Define loss function and optimizer
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=0.001)

    # Training loop
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        for inputs, labels in train_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            running_loss += loss.item()
        print(f"Epoch {epoch+1}/{epochs} - Loss: {running_loss/len(train_loader):.4f}")

    # Evaluation
    model.eval()
    all_preds = []
    all_labels = []
    with torch.no_grad():
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

    # Calculate metrics
    all_preds = np.array(all_preds)
    all_labels = np.array(all_labels)

    accuracy = accuracy_score(all_labels, all_preds) * 100
    precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

    print(f"AlexNet Accuracy on Test Set: {accuracy:.2f}%")
    print(f"Precision: {precision:.4f}")
    print(f"Recall: {recall:.4f}")
    print(f"F1-Score: {f1:.4f}")

# Call the function
train_and_evaluate_AlexNet(train_loader, test_loader, num_classes, epochs=5)

Number of classes: 4
Classes: ['Bus', 'Car', 'Truck', 'motorcycle']
Using device: cuda

/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:208: UserWarning: The parameter 'pretrained' is deprecated since 0.13 and may be removed in the future, please use 'weights' instead.
  warnings.warn(
/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:223: UserWarning: Arguments other than a weight enum or `None` for 'weights' are deprecated since 0.13 and may be removed in the future. The current behavior is equivalent to passing `weights=AlexNet_Weights.IMAGENET1K_V1`. You can also use `weights=AlexNet_Weights.DEFAULT` to get the most up-to-date weights.
  warnings.warn(msg)
Downloading: "[Link]" to /root/.cache/torch/hub/checkpoints/alexnet-owt-[Link]
100%|██████████| 233M/233M [00:01<00:00, 150MB/s]
/usr/local/lib/python3.10/dist-packages/PIL/[Link]: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(

Epoch 1/5 - Loss: 1.6853
Epoch 2/5 - Loss: 1.3936
Epoch 3/5 - Loss: 1.3958
Epoch 4/5 - Loss: 1.3907
Epoch 5/5 - Loss: 1.3893
AlexNet Accuracy on Test Set: 22.50%
Precision: 0.0506
Recall: 0.2250
F1-Score: 0.0827

/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1531: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
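
Both warnings in this output are actionable. As a minimal sketch (not part of the graded run), the model can be loaded with the newer weights enum instead of the deprecated pretrained flag, and the metric call can pass zero_division=0 so sklearn scores unpredicted classes as 0.0 silently; the toy labels below are made up to reproduce the warning's condition:

import numpy as np
from torchvision import models
from torchvision.models import AlexNet_Weights
from sklearn.metrics import precision_recall_fscore_support

# Non-deprecated model loading (torchvision >= 0.13)
model = models.alexnet(weights=AlexNet_Weights.DEFAULT)

# Toy labels: class 3 is never predicted, which is what triggered the warning above
all_labels = np.array([0, 1, 2, 3, 3])
all_preds = np.array([0, 1, 2, 0, 1])
precision, recall, f1, _ = precision_recall_fscore_support(
    all_labels, all_preds, average='weighted', zero_division=0)
print(precision, recall, f1)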

from torchvision import models
from torch import nn, optim
import torch
from tqdm import tqdm
from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

# Define the device
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Training and evaluation function for VGG16
def train_and_evaluate_VGG16(train_loader, test_loader, num_classes, epochs=5):
    # Load the pretrained VGG16 model
    model = models.vgg16(pretrained=True).to(device)

    # Modify the classifier to match the number of classes in the dataset
    model.classifier[6] = nn.Linear(model.classifier[6].in_features, num_classes).to(device)

    # Define the loss function and optimizer
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=0.001)

    # Training loop
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        for inputs, labels in tqdm(train_loader, desc=f"Epoch {epoch+1}/{epochs}"):
            inputs, labels = inputs.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            running_loss += loss.item()

        print(f"Epoch {epoch+1}/{epochs} - Loss: {running_loss/len(train_loader):.4f}")

    # Evaluation
    model.eval()
    all_preds = []
    all_labels = []
    with torch.no_grad():
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

    # Calculate metrics
    all_preds = np.array(all_preds)
    all_labels = np.array(all_labels)

    accuracy = accuracy_score(all_labels, all_preds) * 100
    precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

    print(f"VGG16 Accuracy on Test Set: {accuracy:.2f}%")
    print(f"Precision: {precision:.4f}")
    print(f"Recall: {recall:.4f}")
    print(f"F1-Score: {f1:.4f}")

# Call the function
# Ensure train_loader, test_loader, and num_classes are already defined
train_and_evaluate_VGG16(train_loader, test_loader, num_classes, epochs=5)

Using device: cuda

/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:208: UserWarning: The parameter 'pretrained' is deprecated since 0.13 and may be removed in the future, please use 'weights' instead.
  warnings.warn(
/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:223: UserWarning: Arguments other than a weight enum or `None` for 'weights' are deprecated since 0.13 and may be removed in the future. The current behavior is equivalent to passing `weights=VGG16_Weights.IMAGENET1K_V1`. You can also use `weights=VGG16_Weights.DEFAULT` to get the most up-to-date weights.
  warnings.warn(msg)
Downloading: "[Link]" to /root/.cache/torch/hub/checkpoints/[Link]
100%|██████████| 528M/528M [00:03<00:00, 157MB/s]
Epoch 1/5:  67%|██████▋   | 6/9 [00:10<00:05, 1.72s/it]/usr/local/lib/python3.10/dist-packages/PIL/[Link]: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(
Epoch 1/5: 100%|██████████| 9/9 [00:14<00:00, 1.56s/it]
Epoch 1/5 - Loss: 3.5817
Epoch 2/5: 100%|██████████| 9/9 [00:13<00:00, 1.47s/it]
Epoch 2/5 - Loss: 1.4097
Epoch 3/5: 100%|██████████| 9/9 [00:12<00:00, 1.44s/it]
Epoch 3/5 - Loss: 1.4017
Epoch 4/5: 100%|██████████| 9/9 [00:13<00:00, 1.46s/it]
Epoch 4/5 - Loss: 1.4482
Epoch 5/5: 100%|██████████| 9/9 [00:13<00:00, 1.47s/it]
Epoch 5/5 - Loss: 1.3835

VGG16 Accuracy on Test Set: 26.67%
Precision: 0.1221
Recall: 0.2667
F1-Score: 0.1671

/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1531: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))
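
VGG16 barely beats chance here despite starting from ImageNet weights: a first-epoch loss of 3.58 that settles near ln(4) ≈ 1.386 (the loss of a uniform guess over 4 classes) suggests that fine-tuning all of VGG16's roughly 138M parameters with Adam at lr=0.001 destroys the pretrained features. A common remedy, sketched below for the same 4-class setup (the lr value 1e-4 is my choice, not from the original run), is to freeze the convolutional backbone and train only the classifier:

import torch
from torch import nn, optim
from torchvision import models

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model = models.vgg16(pretrained=True).to(device)

# Freeze the pretrained feature extractor
for param in model.features.parameters():
    param.requires_grad = False

# Replace the final classifier layer (4 vehicle classes assumed)
model.classifier[6] = nn.Linear(model.classifier[6].in_features, 4).to(device)

# Optimize only the parameters that still require gradients, at a gentler LR
optimizer = optim.Adam((p for p in model.parameters() if p.requires_grad), lr=1e-4)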

import torch
from torch import nn, optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader, random_split
from tqdm import tqdm
from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

# Define the LeNet model
class LeNet(nn.Module):
    def __init__(self, num_classes):
        super(LeNet, self).__init__()
        self.conv1 = nn.Conv2d(3, 6, kernel_size=5)   # 3 input channels (RGB)
        self.conv2 = nn.Conv2d(6, 16, kernel_size=5)
        self.fc1 = nn.Linear(16 * 53 * 53, 120)  # Matches 224x224 inputs; adjust for your dataset
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, num_classes)

    def forward(self, x):
        x = torch.relu(self.conv1(x))
        x = torch.max_pool2d(x, kernel_size=2, stride=2)
        x = torch.relu(self.conv2(x))
        x = torch.max_pool2d(x, kernel_size=2, stride=2)
        x = x.view(x.size(0), -1)  # Flatten for fully connected layers
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = self.fc3(x)
        return x

# Define the device
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Define the training and evaluation function
def train_and_evaluate_LeNet(train_loader, test_loader, num_classes, epochs=5):
    # Initialize the LeNet model
    model = LeNet(num_classes).to(device)

    # Define the loss function and optimizer
    criterion = nn.CrossEntropyLoss()
    optimizer = optim.Adam(model.parameters(), lr=0.001)

    # Training loop
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        for inputs, labels in tqdm(train_loader, desc=f"Epoch {epoch+1}/{epochs}"):
            inputs, labels = inputs.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            running_loss += loss.item()
        print(f"Epoch {epoch+1}/{epochs} - Loss: {running_loss/len(train_loader):.4f}")

    # Evaluation
    model.eval()
    all_preds = []
    all_labels = []
    with torch.no_grad():
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

    # Calculate metrics
    all_preds = np.array(all_preds)
    all_labels = np.array(all_labels)

    accuracy = accuracy_score(all_labels, all_preds) * 100
    precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

    print(f"LeNet Accuracy on Test Set: {accuracy:.2f}%")
    print(f"Precision: {precision:.4f}")
    print(f"Recall: {recall:.4f}")
    print(f"F1-Score: {f1:.4f}")

# Dataset Preparation
data_dir = r"/content/final/Dataset"  # Update with your dataset path
transform = transforms.Compose([
    transforms.Resize((224, 224)),  # Resize for LeNet input
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

dataset = datasets.ImageFolder(data_dir, transform=transform)

# Split into training and testing sets
train_size = int(0.7 * len(dataset))
test_size = len(dataset) - train_size
train_dataset, test_dataset = random_split(dataset, [train_size, test_size])

# Create DataLoaders
batch_size = 32
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

# Number of classes
num_classes = len(dataset.classes)
print(f"Number of classes: {num_classes}")
print(f"Classes: {dataset.classes}")

# Train and evaluate LeNet
train_and_evaluate_LeNet(train_loader, test_loader, num_classes, epochs=5)

Using device: cuda
Number of classes: 4
Classes: ['Bus', 'Car', 'Truck', 'motorcycle']

Epoch 1/5:  22%|██▏       | 2/9 [00:01<00:03, 1.75it/s]/usr/local/lib/python3.10/dist-packages/PIL/[Link]: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(
Epoch 1/5: 100%|██████████| 9/9 [00:08<00:00, 1.06it/s]
Epoch 1/5 - Loss: 1.3808
Epoch 2/5: 100%|██████████| 9/9 [00:09<00:00, 1.04s/it]
Epoch 2/5 - Loss: 1.0704
Epoch 3/5: 100%|██████████| 9/9 [00:10<00:00, 1.16s/it]
Epoch 3/5 - Loss: 0.7165
Epoch 4/5: 100%|██████████| 9/9 [00:09<00:00, 1.04s/it]
Epoch 4/5 - Loss: 0.5021
Epoch 5/5: 100%|██████████| 9/9 [00:08<00:00, 1.11it/s]
Epoch 5/5 - Loss: 0.2552

LeNet Accuracy on Test Set: 54.17%
Precision: 0.5266
Recall: 0.5417
F1-Score: 0.5285
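
The hard-coded 16 * 53 * 53 in LeNet's fc1 only matches 224x224 inputs. A small sketch for deriving that number automatically (the helper below, including its name, is mine and not part of the original code): push one dummy image through the conv/pool stack and read off the flattened size.

import torch
from torch import nn

def conv_output_numel(conv_stack, input_shape=(3, 224, 224)):
    # Run one zero-filled dummy image through the stack; return the flattened size
    with torch.no_grad():
        x = torch.zeros(1, *input_shape)
        for layer in conv_stack:
            x = layer(x)
    return x.view(1, -1).size(1)

# LeNet's conv/pool stack from above, expressed as modules
stack = [nn.Conv2d(3, 6, 5), nn.ReLU(), nn.MaxPool2d(2, 2),
         nn.Conv2d(6, 16, 5), nn.ReLU(), nn.MaxPool2d(2, 2)]
print(conv_output_numel(stack))  # 44944 == 16 * 53 * 53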

import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader, random_split
from torchvision import datasets, transforms
from tqdm import tqdm

# 1. ZFNet Model Definition
class ZFNet(nn.Module):
    def __init__(self, num_classes):
        super(ZFNet, self).__init__()
        # Convolutional layers (output sizes below assume 3 x 224 x 224 inputs)
        self.conv1 = nn.Conv2d(3, 96, kernel_size=7, stride=2, padding=1)    # Output: 96 x 110 x 110
        self.conv2 = nn.Conv2d(96, 256, kernel_size=5, stride=2, padding=1)  # Output: 256 x 26 x 26
        self.conv3 = nn.Conv2d(256, 384, kernel_size=3, padding=1)           # Output: 384 x 12 x 12
        self.conv4 = nn.Conv2d(384, 384, kernel_size=3, padding=1)           # Output: 384 x 12 x 12
        self.conv5 = nn.Conv2d(384, 256, kernel_size=3, padding=1)           # Output: 256 x 12 x 12

        # Pooling layer
        self.pool = nn.MaxPool2d(kernel_size=3, stride=2)

        # Placeholder for flattened size
        self._to_linear = None

        # Fully connected layers (fc1 is created on the first forward pass)
        self.fc1 = None
        self.fc2 = nn.Linear(4096, 4096)
        self.fc3 = nn.Linear(4096, num_classes)

    def forward(self, x):
        # Pass through convolutional layers
        x = torch.relu(self.conv1(x))
        x = self.pool(x)
        x = torch.relu(self.conv2(x))
        x = self.pool(x)
        x = torch.relu(self.conv3(x))
        x = torch.relu(self.conv4(x))
        x = torch.relu(self.conv5(x))
        x = self.pool(x)

        # Dynamically set the size of fc1
        if self._to_linear is None:
            self._to_linear = x.view(x.size(0), -1).size(1)
            self.fc1 = nn.Linear(self._to_linear, 4096).to(x.device)  # Initialize fc1 dynamically

        # Flatten the tensor
        x = x.view(x.size(0), -1)

        # Pass through fully connected layers
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = self.fc3(x)
        return x

# 2. Dataset Preparation with Random Split
data_transforms = transforms.Compose([
    transforms.Resize((224, 224)),      # Resize images to 224x224
    transforms.RandomHorizontalFlip(),  # Augmentation: flip images randomly
    transforms.ToTensor(),              # Convert images to tensor
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])  # Normalize to ImageNet stats
])

# Path to your dataset folder (with subfolders like Bus, Car, etc.)
data_dir = '/content/final/Dataset'  # Change this path to your dataset directory

# Load dataset using ImageFolder
dataset = datasets.ImageFolder(data_dir, transform=data_transforms)

# Calculate the size for train/val split (80% train, 20% validation)
train_size = int(0.8 * len(dataset))
val_size = len(dataset) - train_size

# Split the dataset into train and validation sets
train_dataset, val_dataset = random_split(dataset, [train_size, val_size])

# DataLoaders for batch processing
train_loader = DataLoader(train_dataset, batch_size=32, shuffle=True)
val_loader = DataLoader(val_dataset, batch_size=32, shuffle=False)

# 3. Initialize the Model, Loss, and Optimizer
num_classes = len(dataset.classes)  # Number of classes (e.g., 4 classes: Bus, Car, Motorcycle, Truck)
model = ZFNet(num_classes=num_classes)

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
model = model.to(device)

# Loss and optimizer
# NOTE: fc1 does not exist yet at this point (it is created on the first forward
# pass), so Adam never registers or updates its weights; see the nn.LazyLinear
# sketch after the training log.
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

# 4. Training the Model with Metrics Calculation
def train_model_with_metrics(model, criterion, optimizer, num_epochs=25):
    best_model_wts = model.state_dict()
    best_acc = 0.0

    for epoch in range(num_epochs):
        print(f'Epoch {epoch}/{num_epochs - 1}')
        print('-' * 10)

        # Training phase
        model.train()
        running_loss = 0.0
        running_corrects = 0

        for inputs, labels in tqdm(train_loader):
            inputs, labels = inputs.to(device), labels.to(device)

            optimizer.zero_grad()

            # Forward
            outputs = model(inputs)
            loss = criterion(outputs, labels)

            # Backward
            loss.backward()
            optimizer.step()

            # Statistics
            _, preds = torch.max(outputs, 1)
            running_loss += loss.item() * inputs.size(0)
            running_corrects += torch.sum(preds == labels.data)

        epoch_loss = running_loss / len(train_loader.dataset)
        epoch_acc = running_corrects.double() / len(train_loader.dataset)

        print(f'Train Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')

        # Validation phase
        model.eval()
        running_corrects = 0
        all_preds = []
        all_labels = []

        for inputs, labels in val_loader:
            inputs, labels = inputs.to(device), labels.to(device)

            with torch.no_grad():
                outputs = model(inputs)
                _, preds = torch.max(outputs, 1)

            # Store predictions and labels for metrics
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

            running_corrects += torch.sum(preds == labels.data)

        # Calculate metrics
        all_preds = np.array(all_preds)
        all_labels = np.array(all_labels)

        val_acc = accuracy_score(all_labels, all_preds) * 100
        precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

        print(f'Validation Accuracy: {val_acc:.2f}%')
        print(f'Precision: {precision:.4f}')
        print(f'Recall: {recall:.4f}')
        print(f'F1-Score: {f1:.4f}')

        # Keep a copy of the model weights if this is the best epoch so far
        if val_acc > best_acc:
            best_acc = val_acc
            best_model_wts = model.state_dict()

    print(f'Best Validation Accuracy: {best_acc:.2f}%')
    model.load_state_dict(best_model_wts)
    return model

# Train the model
model = train_model_with_metrics(model, criterion, optimizer, num_epochs=25)

ZFNet training log, condensed into a table (25 epochs, 10 batches per epoch at roughly 1 s/batch; the PIL palette warning seen earlier recurred every epoch, and sklearn's UndefinedMetricWarning recurred in the early epochs while some classes received no predictions):

Epoch   Train Loss   Train Acc   Val Acc (%)   Precision   Recall   F1-Score
0       1.6090       0.2406      23.75         0.0963      0.2375   0.1300
1       1.3903       0.2656      25.00         0.1450      0.2500   0.1197
2       1.3892       0.2438      23.75         0.0564      0.2375   0.0912
3       1.3818       0.2563      21.25         0.1092      0.2125   0.1378
4       1.4098       0.2625      26.25         0.0689      0.2625   0.1092
5       1.3906       0.2469      26.25         0.0689      0.2625   0.1092
6       1.3880       0.2250      23.75         0.0609      0.2375   0.0969
7       1.3881       0.2281      27.50         0.1543      0.2750   0.1490
8       1.3804       0.2531      32.50         0.2684      0.3250   0.2655
9       1.3446       0.2969      48.75         0.4777      0.4875   0.4274
10      1.2988       0.3688      45.00         0.3597      0.4500   0.3878
11      1.2850       0.3656      42.50         0.3272      0.4250   0.3669
12      1.2114       0.4625      51.25         0.5125      0.5125   0.4668
13      1.1532       0.4969      52.50         0.5232      0.5250   0.4825
14      1.0977       0.5156      47.50         0.5138      0.4750   0.4652
15      1.0509       0.5344      47.50         0.4834      0.4750   0.4201
16      1.0008       0.6031      53.75         0.5349      0.5375   0.5203
17      0.9009       0.6188      57.50         0.6244      0.5750   0.5744
18      0.8418       0.6375      63.75         0.6349      0.6375   0.6345
19      0.8674       0.6531      57.50         0.6378      0.5750   0.5597
20      0.7596       0.7125      57.50         0.5731      0.5750   0.5650
21      0.6961       0.7563      60.00         0.6005      0.6000   0.5906
22      0.6176       0.7563      58.75         0.6079      0.5875   0.5611
23      0.6368       0.7344      62.50         0.6434      0.6250   0.6148
24      0.5416       0.7938      66.25         0.6651      0.6625   0.6517

Best Validation Accuracy: 66.25%
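
One caveat in the ZFNet code above: fc1 is only created inside forward(), after the Adam optimizer has already been constructed, so fc1's randomly initialized weights are never updated during training. A sketch of a fix (assuming torch >= 1.8, which provides nn.LazyLinear) that keeps the dynamic sizing but materializes the layer before the optimizer is built:

import torch
from torch import nn

class ZFNetHead(nn.Module):
    # Classifier head with a lazily sized first linear layer
    def __init__(self, num_classes):
        super().__init__()
        self.fc1 = nn.LazyLinear(4096)  # in_features inferred on first forward
        self.fc2 = nn.Linear(4096, 4096)
        self.fc3 = nn.Linear(4096, num_classes)

    def forward(self, x):
        x = x.view(x.size(0), -1)
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        return self.fc3(x)

head = ZFNetHead(num_classes=4)
# Materialize fc1 with one dummy batch (256 x 5 x 5 is the conv-stack output for
# 224x224 inputs) BEFORE building the optimizer, so all parameters are registered.
_ = head(torch.zeros(1, 256, 5, 5))
optimizer = torch.optim.Adam(head.parameters(), lr=0.001)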

import torch
from torch import nn, optim
from torchvision import datasets, transforms, models
from torch.utils.data import DataLoader, random_split
from tqdm import tqdm
from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

# Dataset path
data_dir = r"/content/final/Dataset"  # Update with your dataset path

# Define transformations (ResNet expects ImageNet normalization)
transform = transforms.Compose([
    transforms.Resize((224, 224)),  # Resize for ResNet input
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

# Load dataset
dataset = datasets.ImageFolder(data_dir, transform=transform)

# Split dataset into training (70%) and testing (30%)
train_size = int(0.7 * len(dataset))
test_size = len(dataset) - train_size
train_dataset, test_dataset = random_split(dataset, [train_size, test_size])

# Create DataLoaders
batch_size = 32
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

# Number of classes
num_classes = len(dataset.classes)
print(f"Number of classes: {num_classes}")
print(f"Classes: {dataset.classes}")

# Define the device (GPU or CPU)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Load a pre-trained ResNet model
model = models.resnet50(pretrained=True).to(device)  # You can also try resnet18, resnet34, etc.

# Modify the fully connected layer to match the number of classes
model.fc = nn.Linear(model.fc.in_features, num_classes).to(device)

# Define loss function and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

# Training and evaluation loop with metrics
def train_and_evaluate_resnet_with_metrics(train_loader, test_loader, model, criterion, optimizer, num_classes, epochs=5):
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        for inputs, labels in tqdm(train_loader, desc=f"Epoch {epoch+1}/{epochs}"):
            inputs, labels = inputs.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            running_loss += loss.item()

        print(f"Epoch {epoch+1}/{epochs} - Loss: {running_loss/len(train_loader):.4f}")

    # Evaluation
    model.eval()
    all_preds = []
    all_labels = []

    with torch.no_grad():
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)

            # Store predictions and labels for metrics calculation
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

    # Calculate metrics
    all_preds = np.array(all_preds)
    all_labels = np.array(all_labels)

    accuracy = accuracy_score(all_labels, all_preds) * 100
    precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

    print(f"\nEvaluation Metrics on Test Set:")
    print(f"Accuracy: {accuracy:.2f}%")
    print(f"Precision: {precision:.4f}")
    print(f"Recall: {recall:.4f}")
    print(f"F1-Score: {f1:.4f}")

# Call the function to train and evaluate the model with metrics
train_and_evaluate_resnet_with_metrics(train_loader, test_loader, model, criterion, optimizer, num_classes, epochs=5)

Number of classes: 4
Classes: ['Bus', 'Car', 'Truck', 'motorcycle']
Using device: cuda
/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:208: UserWarning: The parameter 'pretrained' is deprecated since 0.13 and may be removed in the future, please use 'weights' instead.
  warnings.warn(
/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:223: UserWarning: Arguments other than a weight enum or `None` for 'weights' are deprecated since 0.13 and may be removed in the future. The current behavior is equivalent to passing `weights=ResNet50_Weights.IMAGENET1K_V1`. You can also use `weights=ResNet50_Weights.DEFAULT` to get the most up-to-date weights.
  warnings.warn(msg)
Downloading: "[Link]" to /root/.cache/torch/hub/checkpoints/resnet50-[Link]
100%|██████████| 97.8M/97.8M [00:00<00:00, 160MB/s]
Epoch 1/5: 100%|██████████| 9/9 [00:10<00:00, 1.19s/it]
Epoch 1/5 - Loss: 0.7649
Epoch 2/5: 100%|██████████| 9/9 [00:10<00:00, 1.15s/it]
Epoch 2/5 - Loss: 0.5734
Epoch 3/5: 100%|██████████| 9/9 [00:11<00:00, 1.22s/it]
Epoch 3/5 - Loss: 0.3695
Epoch 4/5: 100%|██████████| 9/9 [00:10<00:00, 1.22s/it]
Epoch 4/5 - Loss: 0.1897
Epoch 5/5: 100%|██████████| 9/9 [00:10<00:00, 1.21s/it]
Epoch 5/5 - Loss: 0.0882
/usr/local/lib/python3.10/dist-packages/PIL/[Link]: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(

Evaluation Metrics on Test Set:
Accuracy: 79.17%
Precision: 0.8028
Recall: 0.7917
F1-Score: 0.7929
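
ResNet50 is the strongest model in this report, but the weighted averages hide which vehicle classes get confused with which. A sketch of a per-class breakdown, reusing the all_labels and all_preds arrays collected in the evaluation loop and dataset.classes for readable names (both assumed to still be in scope):

from sklearn.metrics import classification_report, confusion_matrix

# Per-class precision/recall/F1 for Bus, Car, Truck, motorcycle
print(classification_report(all_labels, all_preds,
                            target_names=dataset.classes, zero_division=0))

# Rows are true classes, columns are predicted classes
print(confusion_matrix(all_labels, all_preds))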

import torch
from torch import nn, optim
from torchvision import datasets, transforms, models
from torch.utils.data import DataLoader, random_split
from tqdm import tqdm
from sklearn.metrics import precision_recall_fscore_support, accuracy_score
import numpy as np

# Dataset path
data_dir = r"/content/final/Dataset"  # Update with your dataset path

# Define transformations (VGG expects ImageNet normalization)
transform = transforms.Compose([
    transforms.Resize((224, 224)),  # Resize for VGG16 input
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

# Load dataset
dataset = datasets.ImageFolder(data_dir, transform=transform)

# Split dataset into training (70%) and testing (30%)
train_size = int(0.7 * len(dataset))
test_size = len(dataset) - train_size
train_dataset, test_dataset = random_split(dataset, [train_size, test_size])

# Create DataLoaders
batch_size = 32
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

# Number of classes
num_classes = len(dataset.classes)
print(f"Number of classes: {num_classes}")
print(f"Classes: {dataset.classes}")

# Define the device (GPU or CPU)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

# Load a pre-trained VGG16 model
model = models.vgg16(pretrained=True).to(device)

# Modify the final fully connected layer to match the number of classes
model.classifier[6] = nn.Linear(model.classifier[6].in_features, num_classes).to(device)

# Define loss function and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

# Training and evaluation loop with metrics
def train_and_evaluate_vgg16_with_metrics(train_loader, test_loader, model, criterion, optimizer, num_classes, epochs=5):
    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        for inputs, labels in tqdm(train_loader, desc=f"Epoch {epoch+1}/{epochs}"):
            inputs, labels = inputs.to(device), labels.to(device)
            optimizer.zero_grad()
            outputs = model(inputs)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()
            running_loss += loss.item()

        print(f"Epoch {epoch+1}/{epochs} - Loss: {running_loss/len(train_loader):.4f}")

    # Evaluation
    model.eval()
    all_preds = []
    all_labels = []

    with torch.no_grad():
        for inputs, labels in test_loader:
            inputs, labels = inputs.to(device), labels.to(device)
            outputs = model(inputs)
            _, preds = torch.max(outputs, 1)

            # Store predictions and labels for metrics calculation
            all_preds.extend(preds.cpu().numpy())
            all_labels.extend(labels.cpu().numpy())

    # Calculate metrics
    all_preds = np.array(all_preds)
    all_labels = np.array(all_labels)

    accuracy = accuracy_score(all_labels, all_preds) * 100
    precision, recall, f1, _ = precision_recall_fscore_support(all_labels, all_preds, average='weighted')

    print(f"\nEvaluation Metrics on Test Set:")
    print(f"Accuracy: {accuracy:.2f}%")
    print(f"Precision: {precision:.4f}")
    print(f"Recall: {recall:.4f}")
    print(f"F1-Score: {f1:.4f}")

# Call the function to train and evaluate the model with metrics
train_and_evaluate_vgg16_with_metrics(train_loader, test_loader, model, criterion, optimizer, num_classes, epochs=5)

Number of classes: 4
Classes: ['Bus', 'Car', 'Truck', 'motorcycle']
Using device: cuda

/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:208: UserWarning: The parameter 'pretrained' is deprecated since 0.13 and may be removed in the future, please use 'weights' instead.
  warnings.warn(
/usr/local/lib/python3.10/dist-packages/torchvision/models/_utils.py:223: UserWarning: Arguments other than a weight enum or `None` for 'weights' are deprecated since 0.13 and may be removed in the future. The current behavior is equivalent to passing `weights=VGG16_Weights.IMAGENET1K_V1`. You can also use `weights=VGG16_Weights.DEFAULT` to get the most up-to-date weights.
  warnings.warn(msg)
Epoch 1/5: 100%|██████████| 9/9 [00:13<00:00, 1.49s/it]
Epoch 1/5 - Loss: 1.9105
Epoch 2/5: 100%|██████████| 9/9 [00:13<00:00, 1.46s/it]
Epoch 2/5 - Loss: 1.9666
Epoch 3/5: 100%|██████████| 9/9 [00:12<00:00, 1.44s/it]
Epoch 3/5 - Loss: 1.4009
Epoch 4/5: 100%|██████████| 9/9 [00:12<00:00, 1.42s/it]
Epoch 4/5 - Loss: 1.3920
Epoch 5/5: 100%|██████████| 9/9 [00:13<00:00, 1.48s/it]
Epoch 5/5 - Loss: 1.3519
/usr/local/lib/python3.10/dist-packages/PIL/[Link]: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(

Evaluation Metrics on Test Set:
Accuracy: 42.50%
Precision: 0.4012
Recall: 0.4250
F1-Score: 0.3700

/usr/local/lib/python3.10/dist-packages/sklearn/metrics/_classification.py:1531: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
  _warn_prf(average, modifier, f"{metric.capitalize()} is", len(result))

Comparative Analysis of Model Performance

Model                Accuracy (%)   Precision   Recall   F1-Score
AlexNet                 22.50        0.0506     0.2250    0.0827
VGG16 (first run)       26.67        0.1221     0.2667    0.1671
VGG16 (second run)      42.50        0.4012     0.4250    0.3700
LeNet                   54.17        0.5266     0.5417    0.5285
ZFNet                   66.25        0.6651     0.6625    0.6517
ResNet50                79.17        0.8028     0.7917    0.7929

ResNet50 leads on every metric. Note that ZFNet's row reports its best validation-set metrics over 25 epochs, while the other rows report test-set metrics after 5 epochs. The near-chance scores of the fine-tuned AlexNet and the first VGG16 run suggest that end-to-end fine-tuning with Adam at lr=0.001 disrupted their pretrained weights, leaving them behind even the small from-scratch LeNet.
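
A small sketch of producing this table programmatically, with the metrics hard-coded from the runs above (in a refactor, each train-and-evaluate function could simply return its four metrics instead of only printing them):

# Hypothetical summary step; numbers restate the results reported above
results = {
    "AlexNet":  (22.50, 0.0506, 0.2250, 0.0827),
    "VGG16":    (26.67, 0.1221, 0.2667, 0.1671),
    "LeNet":    (54.17, 0.5266, 0.5417, 0.5285),
    "ZFNet":    (66.25, 0.6651, 0.6625, 0.6517),
    "ResNet50": (79.17, 0.8028, 0.7917, 0.7929),
}

print(f"{'Model':<10} {'Acc (%)':>8} {'Precision':>10} {'Recall':>8} {'F1':>8}")
for name, (acc, p, r, f1) in sorted(results.items(), key=lambda kv: -kv[1][0]):
    print(f"{name:<10} {acc:>8.2f} {p:>10.4f} {r:>8.4f} {f1:>8.4f}")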
