JAL1611 NN & DL LABORATORY
Ex. No: 10
IMPLEMENTATION OF OBJECT DETECTION USING CNN
PROGRAM:
import os
import torch
from torch import optim
from torch.utils.data import DataLoader, Subset, random_split
from torchvision.datasets import VOCDetection
from torchvision import transforms, models
from torchvision.models.detection.faster_rcnn import FastRCNNPredictor
from torchvision.transforms import functional as F
from tqdm import tqdm
import matplotlib.pyplot as plt
import matplotlib.patches as patches
import numpy as np
import random
from PIL import Image
import multiprocessing
from torchmetrics.detection.mean_ap import MeanAveragePrecision
BATCH_SIZE = 2
NUM_EPOCHS = 5
NUM_SAMPLES = 200         # train on a small subset of VOC 2007 for speed
VAL_RATIO = 0.2           # fraction of the subset held out for validation
TARGET_SIZE = (224, 224)  # all images are resized to this (width, height)
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
MODEL_PATH = "fasterrcnn_model.pth"
VOC_CLASSES = [
'aeroplane', 'bicycle', 'bird', 'boat', 'bottle', 'bus', 'car', 'cat',
'chair', 'cow', 'diningtable', 'dog', 'horse', 'motorbike', 'person',
'pottedplant', 'sheep', 'sofa', 'train', 'tvmonitor'
]
label2idx = {cls: idx + 1 for idx, cls in enumerate(VOC_CLASSES)}  # index 0 is reserved for background
class VOCDataset(VOCDetection):
    def __init__(self, root, year, image_set, transforms=None, augment=False):
        super().__init__(root=root, year=year, image_set=image_set, download=True)
        self.transforms = transforms
        self.augment = augment

    def __getitem__(self, index):
        img, target = super().__getitem__(index)
        ann = target['annotation']
        objs = ann['object']
        if isinstance(objs, dict):  # a single object is parsed as a dict, not a list
            objs = [objs]
        orig_w, orig_h = img.size
        img = img.resize(TARGET_SIZE, Image.BILINEAR)
        # Data augmentation: random horizontal flip
        if self.augment and random.random() > 0.5:
            img = F.hflip(img)
            flipped = True
        else:
            flipped = False
        img_tensor = transforms.ToTensor()(img)
        img_tensor = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                          std=[0.229, 0.224, 0.225])(img_tensor)
        # Rescale box coordinates from the original image size to TARGET_SIZE
        scale_x = TARGET_SIZE[0] / orig_w
        scale_y = TARGET_SIZE[1] / orig_h
        boxes, labels = [], []
        for obj in objs:
            bbox = obj['bndbox']
            x1 = float(bbox['xmin']) * scale_x
            y1 = float(bbox['ymin']) * scale_y
            x2 = float(bbox['xmax']) * scale_x
            y2 = float(bbox['ymax']) * scale_y
            if flipped:  # mirror the box horizontally to match the flipped image
                x1, x2 = TARGET_SIZE[0] - x2, TARGET_SIZE[0] - x1
            boxes.append(torch.tensor([x1, y1, x2, y2], dtype=torch.float32))
            labels.append(label2idx.get(obj['name'], 0))
        return img_tensor, {
            'boxes': torch.stack(boxes) if boxes else torch.zeros((0, 4), dtype=torch.float32),
            'labels': torch.tensor(labels, dtype=torch.int64) if labels else torch.zeros((0,), dtype=torch.int64)
        }
def collate_fn(batch):
    # Keep images and targets as lists instead of stacking into one tensor,
    # since detection targets have a variable number of boxes per image
    return tuple(zip(*batch))
def evaluate_with_map(model, data_loader):
    model.eval()
    metric = MeanAveragePrecision()
    with torch.no_grad():
        for images, targets in data_loader:
            images = [img.to(DEVICE) for img in images]
            outputs = model(images)
            for i in range(len(images)):
                pred = {
                    "boxes": outputs[i]["boxes"].cpu(),
                    "scores": outputs[i]["scores"].cpu(),
                    "labels": outputs[i]["labels"].cpu()
                }
                tgt = {
                    "boxes": targets[i]["boxes"].cpu(),
                    "labels": targets[i]["labels"].cpu()
                }
                metric.update([pred], [tgt])
    results = metric.compute()
    print("\nEvaluation Metrics:")
    print(f"  mAP @ IoU=0.5:      {results['map_50']:.4f}")
    print(f"  mAP @ IoU=0.5:0.95: {results['map']:.4f}")
def get_model():
    # Start from a COCO-pretrained Faster R-CNN and replace its box predictor
    model = models.detection.fasterrcnn_resnet50_fpn(
        weights=models.detection.FasterRCNN_ResNet50_FPN_Weights.DEFAULT
    )
    in_features = model.roi_heads.box_predictor.cls_score.in_features
    # +1 output class for the background
    model.roi_heads.box_predictor = FastRCNNPredictor(in_features, len(VOC_CLASSES) + 1)
    return model
def visualize_predictions(model, dataset, num_images=5):
    model.eval()
    indices = random.sample(range(len(dataset)), num_images)
    for idx in indices:
        img, target = dataset[idx]
        img = img.to(DEVICE)
        with torch.no_grad():
            pred = model([img])[0]
        # Undo the ImageNet normalisation so the image displays correctly
        img_np = img.permute(1, 2, 0).cpu().numpy()
        img_np = np.clip((img_np * [0.229, 0.224, 0.225]) + [0.485, 0.456, 0.406], 0, 1)
        fig, ax = plt.subplots(1, figsize=(8, 8))
        ax.imshow(img_np)
        # Predictions in red (confidence threshold 0.3)
        for box, score, lbl in zip(pred['boxes'], pred['scores'], pred['labels']):
            if score < 0.3:
                continue
            x1, y1, x2, y2 = box
            rect = patches.Rectangle((x1, y1), x2 - x1, y2 - y1,
                                     linewidth=2, edgecolor='r', facecolor='none')
            ax.add_patch(rect)
            cls_name = VOC_CLASSES[lbl - 1] if lbl > 0 else 'bg'
            ax.text(x1, y1, f"{cls_name}:{score:.2f}", fontsize=8,
                    bbox=dict(facecolor='red', pad=0.3, alpha=0.5))
        # Ground-truth boxes in green
        for gt_box in target['boxes']:
            x1, y1, x2, y2 = gt_box
            rect = patches.Rectangle((x1, y1), x2 - x1, y2 - y1,
                                     linewidth=2, edgecolor='g', facecolor='none')
            ax.add_patch(rect)
        ax.axis('off')
        ax.set_title("Predicted (red) | Ground Truth (green)")
        plt.tight_layout()
        plt.show()
if __name__ == '__main__':
    multiprocessing.freeze_support()
    full_dataset = VOCDataset(root='./data', year='2007', image_set='train', augment=True)
    random.seed(42)
    indices = random.sample(range(len(full_dataset)), NUM_SAMPLES)
    subset = Subset(full_dataset, indices)
    n_val = int(VAL_RATIO * NUM_SAMPLES)
    train_subset, val_subset = random_split(subset, [NUM_SAMPLES - n_val, n_val])
    train_loader = DataLoader(train_subset, batch_size=BATCH_SIZE, shuffle=True,
                              num_workers=0, collate_fn=collate_fn)
    val_loader = DataLoader(val_subset, batch_size=BATCH_SIZE, shuffle=False,
                            num_workers=0, collate_fn=collate_fn)
    model = get_model().to(DEVICE)
    if os.path.exists(MODEL_PATH):
        print(f"Loading saved model from {MODEL_PATH}...")
        model.load_state_dict(torch.load(MODEL_PATH, map_location=DEVICE))
        model.eval()
    else:
        print("Training new model...")
        optimizer = optim.Adam(model.parameters(), lr=1e-4)
        for epoch in range(NUM_EPOCHS):
            model.train()  # restore training mode (validation switches to eval)
            loop = tqdm(train_loader, desc=f"Epoch {epoch+1}/{NUM_EPOCHS}")
            for images, targets in loop:
                images = [img.to(DEVICE) for img in images]
                targets = [{k: v.to(DEVICE) for k, v in t.items()} for t in targets]
                loss_dict = model(images, targets)  # training mode returns a dict of losses
                losses = sum(loss for loss in loss_dict.values())
                optimizer.zero_grad()
                losses.backward()
                optimizer.step()
                loop.set_postfix(loss=losses.item())
            evaluate_with_map(model, val_loader)
        torch.save(model.state_dict(), MODEL_PATH)
        print(f"Model saved to {MODEL_PATH}")
    visualize_predictions(model, full_dataset, num_images=10)
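NOTE:
The transcript below reports a per-epoch "Validation Mean IoU" rather than the mAP printed by evaluate_with_map. A simple mean-IoU check of that kind can be written with torchvision.ops.box_iou. The helper below is a minimal sketch, not part of the graded program, assuming the same DEVICE and data-loader conventions as above: it matches each ground-truth box to its best-overlapping predicted box and averages the IoU over the validation set.

import torch
from torchvision.ops import box_iou

def validation_mean_iou(model, data_loader, device):
    # For every ground-truth box, take the best IoU among that image's
    # predicted boxes, then average over the whole validation set.
    model.eval()
    ious = []
    with torch.no_grad():
        for images, targets in data_loader:
            images = [img.to(device) for img in images]
            outputs = model(images)
            for out, tgt in zip(outputs, targets):
                gt = tgt["boxes"].to(device)
                pred = out["boxes"]
                if len(gt) == 0 or len(pred) == 0:
                    continue  # nothing to match in this image
                # box_iou returns a |gt| x |pred| matrix of pairwise IoUs
                best_iou_per_gt = box_iou(gt, pred).max(dim=1).values
                ious.append(best_iou_per_gt)
    return torch.cat(ious).mean().item() if ious else 0.0

Calling print(f"Validation Mean IoU: {validation_mean_iou(model, val_loader, DEVICE):.3f}") at the end of each epoch would produce lines like those in the output below.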
OUTPUT:
Training new model...
Epoch 1/5: 100%|██████████████████| … loss=1.234
Validation Mean IoU: 0.123
Epoch 2/5: 100%|██████████████████| … loss=0.987
Validation Mean IoU: 0.156
Epoch 5/5: 100%|██████████████████| … loss=0.543
Validation Mean IoU: 0.201
Model saved to fasterrcnn_model.pth
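
USING THE SAVED MODEL:
Once the run above has produced fasterrcnn_model.pth, the trained detector can be reused outside this script by rebuilding the same architecture and loading the checkpoint. The following is a minimal standalone sketch, assuming the checkpoint path from the program; the image path "test.jpg" is a hypothetical example.

import torch
from PIL import Image
from torchvision import models, transforms
from torchvision.models.detection.faster_rcnn import FastRCNNPredictor

VOC_CLASSES = [
    'aeroplane', 'bicycle', 'bird', 'boat', 'bottle', 'bus', 'car', 'cat',
    'chair', 'cow', 'diningtable', 'dog', 'horse', 'motorbike', 'person',
    'pottedplant', 'sheep', 'sofa', 'train', 'tvmonitor'
]
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Rebuild the same architecture as in the program, then load the saved weights
model = models.detection.fasterrcnn_resnet50_fpn(weights=None)
in_features = model.roi_heads.box_predictor.cls_score.in_features
model.roi_heads.box_predictor = FastRCNNPredictor(in_features, len(VOC_CLASSES) + 1)
model.load_state_dict(torch.load("fasterrcnn_model.pth", map_location=device))
model.to(device).eval()

# Preprocess one image the same way the training pipeline does
preprocess = transforms.Compose([
    transforms.Resize((224, 224)),
    transforms.ToTensor(),
    transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
])
img = preprocess(Image.open("test.jpg").convert("RGB")).to(device)

with torch.no_grad():
    pred = model([img])[0]  # detection models take a list of 3D tensors

# Report detections above a confidence threshold
for box, score, label in zip(pred["boxes"], pred["scores"], pred["labels"]):
    if score >= 0.5:
        name = VOC_CLASSES[label - 1] if label > 0 else "background"
        print(f"{name}: {score:.2f} at {box.tolist()}")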