CV Record
TECHNOLOGY
M.SC ARTIFICIAL INTELLIGENCE AND MACHINE LEARNING
COMPUTER VISION LAB RECORD
NAME: Shamruthi R
Basic Image Operations and Geometric Transformations
Ex.no : 01
Date : 10/07/2023
Aim :
To read and display an image, convert a colour image into a grayscale image, perform scaling, rotation, and affine, Euclidean, and similarity transformations, and read a frame from a video and display it.
Code :
import cv2
from google.colab.patches import cv2_imshow

# Read the image (IMREAD_UNCHANGED keeps the file's original channels)
img = cv2.imread('/content/image_cv.jpg', cv2.IMREAD_UNCHANGED)
cv2_imshow(img)

# Convert the colour image to grayscale and display it
gray_image = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
cv2_imshow(gray_image)
import cv2
import numpy as np
from matplotlib import pyplot as plt

rows, cols, ch = img.shape

# Affine transformation: map three source points to three destination points.
# (pts2 is missing from the record; the values below are example destinations.)
pts1 = np.float32([[50, 50], [200, 50], [50, 200]])
pts2 = np.float32([[10, 100], [200, 50], [100, 250]])
M = cv2.getAffineTransform(pts1, pts2)
dst = cv2.warpAffine(img, M, (cols, rows))

plt.subplot(121)
plt.imshow(img)
plt.title('Input')
plt.subplot(122)
plt.imshow(dst)
plt.title('Output')
plt.show()
Rotation and scaling transformations
# Rotate the image by 30 degrees about its centre.
# With scale = 1 this is a Euclidean (rigid) transformation;
# a scale other than 1 makes it a similarity transformation.
M = cv2.getRotationMatrix2D((cols/2, rows/2), 30, 1)
dst = cv2.warpAffine(img, M, (cols, rows))

# Scale the rotated image to 50% of its original size
scale_percent = 50  # percent of original size
width = int(dst.shape[1] * scale_percent / 100)
height = int(dst.shape[0] * scale_percent / 100)
dim = (width, height)

# Resize image
resized = cv2.resize(dst, dim, interpolation=cv2.INTER_AREA)
print('Resized image with the dimensions of', resized.shape)
cv2_imshow(resized)
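The record does not include the video-reading step named in the aim; a minimal sketch, assuming a video at /content/sample.mp4:

import cv2
from google.colab.patches import cv2_imshow

# Open the video and read its first frame ('/content/sample.mp4' is an assumed path)
cap = cv2.VideoCapture('/content/sample.mp4')
ret, frame = cap.read()  # ret is False if no frame could be read
if ret:
    cv2_imshow(frame)
cap.release()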
Output :
Result :
The above code has been executed and the output has been verified.
Object Detection using a Pre-trained Model (YOLOv8)
Ex.no : 02
Date : 27/07/2023
Aim :
To perform object detection using a pre-trained model.
Code :
import os
import yaml
from shutil import copytree, ignore_patterns
import xml.etree.ElementTree as ET
from google.colab import drive
drive.mount('/content/drive')
root_path = '/content/drive/MyDrive/archive'
os.listdir(root_path)
train_data_path = os.path.join(root_path,'train_zip/train')
test_data_path = os.path.join(root_path,'test_zip/test')
'''All .xml and .jpg file names'''
train_data_description = os.listdir(train_data_path)
test_data_description = os.listdir(test_data_path)

'''train_annotation_file_paths and test_annotation_file_paths contain all .xml file paths;
train_image_file_paths and test_image_file_paths contain all .jpg file paths'''
train_annotation_file_paths = [os.path.join(train_data_path, i) for i in train_data_description if '.xml' in i]
train_image_file_paths = [os.path.join(train_data_path, i) for i in train_data_description if '.jpg' in i]
test_annotation_file_paths = [os.path.join(test_data_path, i) for i in test_data_description if '.xml' in i]
test_image_file_paths = [os.path.join(test_data_path, i) for i in test_data_description if '.jpg' in i]
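The convert_xml_to_txt helper is not preserved in the record apart from its image-size parsing fragment; a minimal reconstruction that writes Pascal VOC .xml annotations out as YOLO-format .txt labels:

def convert_xml_to_txt(data_path, xml_file, class_dict, dest_path):
    '''Convert one Pascal VOC .xml annotation into a YOLO-format .txt label file.'''
    tree = ET.parse(xml_file)
    root = tree.getroot()
    image_width = int(root.find('size/width').text)
    image_height = int(root.find('size/height').text)
    lines = []
    for obj in root.findall('object'):
        cls_id = class_dict[obj.find('name').text]
        box = obj.find('bndbox')
        xmin, ymin = float(box.find('xmin').text), float(box.find('ymin').text)
        xmax, ymax = float(box.find('xmax').text), float(box.find('ymax').text)
        # YOLO format: class x_centre y_centre width height, all normalised to [0, 1]
        xc = (xmin + xmax) / 2 / image_width
        yc = (ymin + ymax) / 2 / image_height
        w = (xmax - xmin) / image_width
        h = (ymax - ymin) / image_height
        lines.append(f'{cls_id} {xc:.6f} {yc:.6f} {w:.6f} {h:.6f}')
    out_name = os.path.splitext(os.path.basename(xml_file))[0] + '.txt'
    with open(os.path.join(dest_path, out_name), 'w') as f:
        f.write('\n'.join(lines))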
# Class-name to index mapping (matches the img_dict used for display below)
class_dict = {'apple': 0, 'banana': 1, 'orange': 2}

dest_path = '/content/drive/MyDrive/Reference/ObjectDetection/test/labels/'
for i in test_annotation_file_paths:
    convert_xml_to_txt(test_data_path, i, class_dict, dest_path)
yaml_path = "/content/drive/MyDrive/Reference/data.yaml"

from ultralytics import YOLO
# 'yolov8n.yaml' builds the model from its config; use 'yolov8n.pt' to start from pre-trained weights
model = YOLO('yolov8n.yaml')

'''Training the model'''
results = model.train(data=yaml_path, epochs=50, batch=4)

'''Predicting a single image to check how well the model works'''
Test_image_results = model('/content/drive/MyDrive/Reference/ObjectDetection/test/images/mixed_23.jpg')
Test_image_results[0].boxes.data.tolist()
import cv2
import matplotlib.pyplot as plt

'''Load the image'''
image = cv2.imread('/content/drive/MyDrive/archive/test_zip/test/mixed_23.jpg')
copy_image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)  # RGB copy of the original, kept for reference
img_dict = {0: 'apple', 1: 'banana', 2: 'orange'}

'''Iterate over the bounding-box predictions'''
for bbox in Test_image_results[0].boxes.data.tolist():
    x1, y1, x2, y2, confidence, label = bbox
    '''Draw the rectangle'''
    cv2.rectangle(image, (int(x1), int(y1)), (int(x2), int(y2)), (0, 255, 0), 2)
    '''Add the class label above the box'''
    cv2.putText(image, img_dict[int(label)], (int(x1), int(y1 - 10)),
                cv2.FONT_HERSHEY_SIMPLEX, 0.9, (0, 255, 0), 2)

'''Convert the BGR image to RGB for matplotlib'''
image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

'''Display the image using matplotlib'''
plt.imshow(image_rgb)
Output :
Result :
The above code has been executed and the output has been verified.
Histogram Equalization
Ex.no : 03
Date : 04/08/2023
Aim :
To implement the following transformations from scratch: a) read any image, convert it to grayscale, and display its histogram (library functions may be used); b) apply global histogram equalization to the image after converting it to a 2D array (hand-coded); c) display the converted image and its histogram, and compare the two.
Code :
a)
import cv2
import numpy as np
from PIL import Image
from matplotlib import pyplot as plt

# Read the image ('image.jpg' is an assumed path; the record omits the read)
image = cv2.imread('image.jpg')

# Resizing the image for compatibility
image = cv2.resize(image, (500, 600))

# Convert to a PIL image, then to grayscale
img = Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
imgray = img.convert(mode='L')
img_array = np.asarray(imgray)

b)
# Histogram: counts of the 256 intensity levels, normalised to a PDF
histogram_array = np.bincount(img_array.flatten(), minlength=256)
num_pixels = np.sum(histogram_array)
histogram_array = histogram_array/num_pixels

# Cumulative distribution function (CDF)
chistogram_array = np.cumsum(histogram_array)

# Transformation map: scale the CDF to the [0, 255] intensity range
transform_map = np.floor(255 * chistogram_array).astype(np.uint8)

# Apply the map to every pixel and reshape back to the image shape
img_list = list(img_array.flatten())
eq_img_list = [transform_map[p] for p in img_list]
eq_img_array = np.reshape(np.asarray(eq_img_list), img_array.shape)

c)
# PDFs and CDFs of the original and equalized images for comparison
ori_pdf = histogram_array
ori_cdf = chistogram_array
eq_histogram_array = np.bincount(eq_img_array.flatten(), minlength=256)
num_pixels = np.sum(eq_histogram_array)
eq_pdf = eq_histogram_array/num_pixels
eq_cdf = np.cumsum(eq_pdf)

# Plot the PDFs
plt.figure()
plt.plot(ori_pdf)
plt.plot(eq_pdf)
plt.xlabel('Pixel intensity')
plt.ylabel('Distribution')
plt.legend(['Original', 'Equalized'])

# Plot the CDFs
plt.figure()
plt.plot(ori_cdf)
plt.plot(eq_cdf)
plt.xlabel('Pixel intensity')
plt.ylabel('Cumulative distribution')
plt.legend(['Original', 'Equalized'])

# Save the equalized image and reload it for display
save_filename = 'devasena-1.jpg'
eq_img = Image.fromarray(eq_img_array, mode='L')
eq_img.save(save_filename)
img = Image.open(save_filename)
Output :
Result :
The above code has been executed and the output has been verified.
Object Detection using Pre-Trained CNN models-Fruit DS
Ex.no : 04
Date : 11/08/2023
Aim :
To Implement object detection using a pretrained CNN model (e.g., SSD, YOLO, or Faster
R-CNN) on an image dataset containing multiple objects and Draw bounding boxes around the
detected objects and display the image with the identified objects.
Code :
!pip install -q torch_snippets lovely-tensors torchinfo

import numpy as np
import torch
import matplotlib.pyplot as plt
from PIL import Image
from torch.utils.data import Dataset, DataLoader
from torchvision import models
from torchvision.models.detection.faster_rcnn import FastRCNNPredictor
from torchvision.ops import nms
from torch_snippets import Glob, Report
from torchinfo import summary
from xml.etree import ElementTree as et

device = 'cuda' if torch.cuda.is_available() else 'cpu'

# Define the root paths where the data is located in Google Drive
root = '/content/drive/MyDrive/CV_LAB/train'
val_root = '/content/drive/MyDrive/CV_LAB/test'  # validation split (assumed path)

# List of labels: the first is the background class, the rest are the fruits
labels = ['background', 'orange', 'apple', 'banana']
label2target = {l: t for t, l in enumerate(labels)}
targets2label = {t: l for l, t in label2target.items()}
num_classes = len(labels)
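Only two lines of the plot_img_bbox helper survive in the record; a minimal sketch consistent with how it is called at the end of this program:

def plot_img_bbox(img, bboxes):
    '''Show an image with a rectangle drawn for each (xmin, ymin, xmax, ymax) box.'''
    import matplotlib.patches as patches
    fig, a = plt.subplots(1, 1)
    a.imshow(img)
    for box in bboxes:
        xmin, ymin, xmax, ymax = box
        rect = patches.Rectangle((xmin, ymin), xmax - xmin, ymax - ymin,
                                 linewidth=2, edgecolor='r', facecolor='none')
        a.add_patch(rect)
    plt.show()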
def preprocess_img(img):
    # HWC -> CHW tensor, as expected by torchvision detection models
    img = torch.tensor(img).permute(2, 0, 1)
    return img.float()

class FruitsDataset(Dataset):
    def __init__(self, root=root, transforms=None):
        self.root = root
        self.transforms = transforms
        self.img_paths = sorted(Glob(self.root + '/*.jpg'))
        self.xml_paths = sorted(Glob(self.root + '/*.xml'))

    def __len__(self):
        return len(self.img_paths)
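    # The record omits __getitem__ and collate_fn, both required by the
    # DataLoaders below; a minimal sketch in the Faster R-CNN target format:
    def __getitem__(self, ix):
        img = np.array(Image.open(self.img_paths[ix]).convert('RGB')) / 255.
        tree = et.parse(self.xml_paths[ix])
        boxes, labs = [], []
        for obj in tree.getroot().findall('object'):
            labs.append(label2target[obj.find('name').text])
            bb = obj.find('bndbox')
            boxes.append([int(bb.find(c).text) for c in ['xmin', 'ymin', 'xmax', 'ymax']])
        target = {'boxes': torch.tensor(boxes).float(),
                  'labels': torch.tensor(labs).long()}
        return preprocess_img(img), target

    def collate_fn(self, batch):
        # Detection models take lists of images/targets, not stacked tensors
        return tuple(zip(*batch))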
train_ds = FruitsDataset()
train_dl = DataLoader(train_ds, batch_size=4, shuffle=True, collate_fn=train_ds.collate_fn)
val_ds = FruitsDataset(root=val_root)
val_dl = DataLoader(val_ds, batch_size=2, shuffle=True, collate_fn=val_ds.collate_fn)
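The get_model helper is not preserved in the record; the standard torchvision recipe for fine-tuning a COCO-pre-trained Faster R-CNN, matching the FastRCNNPredictor import above, is a reasonable reconstruction:

def get_model():
    # Load a Faster R-CNN pre-trained on COCO and replace its box-predictor
    # head with one sized for our classes (background + 3 fruits)
    model = models.detection.fasterrcnn_resnet50_fpn(pretrained=True)
    in_features = model.roi_heads.box_predictor.cls_score.in_features
    model.roi_heads.box_predictor = FastRCNNPredictor(in_features, num_classes)
    return model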
model = get_model().to(device)

# Sanity check: in train mode the model returns its loss dictionary for one batch
imgs, targets = next(iter(train_dl))
imgs = [img.to(device) for img in imgs]
targets = [{k: v.to(device) for k, v in t.items()} for t in targets]
print(model(imgs, targets))

summary(model, (1, 3, 224, 224))
def train_batch(batch, model, optim):
    model.train()
    imgs, targets = batch
    imgs = [img.to(device) for img in imgs]
    targets = [{k: v.to(device) for k, v in t.items()} for t in targets]
    optim.zero_grad()
    losses = model(imgs, targets)  # dict of the four detection losses
    loss = sum(loss for loss in losses.values())
    loss.backward()
    optim.step()
    return loss, losses

@torch.no_grad()
def validate_batch(batch, model, optim):
    # model.train() is kept so the forward pass returns the loss dict
    # (in eval mode a detection model returns predictions instead)
    model.train()
    imgs, targets = batch
    imgs = [img.to(device) for img in imgs]
    targets = [{k: v.to(device) for k, v in t.items()} for t in targets]
    optim.zero_grad()
    losses = model(imgs, targets)
    loss = sum(loss for loss in losses.values())
    return loss, losses
model = get_model().to(device)
optim = torch.optim.SGD(model.parameters(), lr=0.005,
                        weight_decay=5e-4, momentum=0.9)
n_epochs = 1
log = Report(n_epochs)

for e in range(n_epochs):
    for i, batch in enumerate(train_dl):
        N = len(train_dl)
        loss, losses = train_batch(batch, model, optim)
        loc_loss, regr_loss, loss_objectness, loss_rpn_box_reg = \
            [losses[k] for k in ['loss_classifier', 'loss_box_reg',
                                 'loss_objectness', 'loss_rpn_box_reg']]
        log.record(e + (i+1)/N, trn_loss=loss.item(), trn_loc_loss=loc_loss.item(),
                   trn_regr_loss=regr_loss.item(),
                   trn_loss_objectness=loss_objectness.item(),
                   trn_loss_rpn_box_reg=loss_rpn_box_reg.item())
    for i, batch in enumerate(val_dl):
        N = len(val_dl)
        loss, losses = validate_batch(batch, model, optim)
        loc_loss, regr_loss, loss_objectness, loss_rpn_box_reg = \
            [losses[k] for k in ['loss_classifier', 'loss_box_reg',
                                 'loss_objectness', 'loss_rpn_box_reg']]
        log.record(e + (i+1)/N, val_loss=loss.item(), val_loc_loss=loc_loss.item(),
                   val_regr_loss=regr_loss.item(),
                   val_loss_objectness=loss_objectness.item(),
                   val_loss_rpn_box_reg=loss_rpn_box_reg.item())
    log.report_avgs(e+1)

log.plot_epochs(['trn_loss', 'val_loss'])
def decode_output(output):
    '''Convert raw model output into lists of boxes, confidences, and class names.'''
    bbs = output['boxes'].cpu().detach().numpy().astype(np.uint16)
    labels = np.array([targets2label[i] for i in output['labels'].cpu().detach().numpy()])
    confs = output['scores'].cpu().detach().numpy()
    # Non-maximum suppression to drop heavily overlapping boxes
    idxs = nms(torch.tensor(bbs.astype(np.float32)), torch.tensor(confs), 0.05)
    bbs, confs, labels = [tensor[idxs] for tensor in [bbs, confs, labels]]
    if len(idxs) == 1:
        bbs, confs, labels = [np.array([tensor]) for tensor in [bbs, confs, labels]]
    return bbs.tolist(), confs.tolist(), labels.tolist()
model.eval()
for i, (images, targets) in enumerate(val_dl):
    if i == 3: break
    # Move the batch images to the device and run inference
    images = [img.to(device) for img in images]
    outputs = model(images)
    for j, output in enumerate(outputs):
        bbs, confs, labels = decode_output(output)
        plot_img_bbox(images[j].cpu().permute(1, 2, 0), bbs)
Output :
Result :
The above code has been executed and the output has been verified.
Image enhancement-Linear filter operations
Ex.no : 05
Date : 24/08/2023
Aim :
To apply linear filter operations on a given image and display the output: filters for blurring (box, Gaussian, median, bilateral), filters for sharpening (Laplacian, unsharp mask, Sobel or Prewitt), and noise-reduction filters.
Code :
import cv2
import numpy as np
from google.colab.patches import cv2_imshow
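Only the imports survive in the record for this experiment; a minimal sketch of the filter bank the aim describes, assuming an input image at /content/image.jpg:

# Read the input image ('/content/image.jpg' is an assumed path)
img = cv2.imread('/content/image.jpg')

# --- Blurring filters ---
box = cv2.blur(img, (5, 5))                      # box (mean) filter
gaussian = cv2.GaussianBlur(img, (5, 5), 0)      # Gaussian filter
median = cv2.medianBlur(img, 5)                  # median filter (also removes salt-and-pepper noise)
bilateral = cv2.bilateralFilter(img, 9, 75, 75)  # edge-preserving smoothing

# --- Sharpening / edge filters ---
laplacian = cv2.Laplacian(img, cv2.CV_64F)          # second-derivative edges
sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)  # Sobel gradient along x
# Unsharp mask: original + (original - blurred)
unsharp = cv2.addWeighted(img, 1.5, gaussian, -0.5, 0)

for name, out in [('Box', box), ('Gaussian', gaussian), ('Median', median),
                  ('Bilateral', bilateral), ('Unsharp', unsharp)]:
    print(name)
    cv2_imshow(out)

# convertScaleAbs maps the float edge responses back to displayable uint8
cv2_imshow(cv2.convertScaleAbs(laplacian))
cv2_imshow(cv2.convertScaleAbs(sobelx))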
Output :
Result :
The above code has been executed and the output has been verified.
Morphological Operators in Binary Image processing
Ex.no : 06
Date : 24/08/2023
Aim :
To read any image, convert it to a binary image, and a) apply the four basic morphological operators (erosion, dilation, opening, and closing) without using built-in functions and display the converted image; b) perform the same operations using OpenCV library functions and display the output.
Code :
import cv2
import numpy as np
import matplotlib.pyplot as plt

# Read the image as grayscale and threshold it to binary, as the aim requires
img1 = cv2.imread("download1.png", 0)
_, img1 = cv2.threshold(img1, 127, 255, cv2.THRESH_BINARY)

# Acquire size of the image
m, n = img1.shape

# Show the image
plt.imshow(img1, cmap="gray")
# k = 11, 15, 45 - different sizes of the structuring element
k = 11
SE = np.ones((k, k), dtype=np.uint8)
constant = (k-1)//2

# Define new (output) image
imgErode = np.zeros((m, n), dtype=np.uint8)

# Erosion without using the inbuilt cv2 morphology function:
# each output pixel is the minimum over the neighbourhood selected by the SE
for i in range(constant, m-constant):
    for j in range(constant, n-constant):
        temp = img1[i-constant:i+constant+1, j-constant:j+constant+1]
        product = temp*SE
        imgErode[i, j] = np.min(product)

plt.imshow(imgErode, cmap="gray")
cv2.imwrite("Eroded3.png", imgErode)
img2 = cv2.imread("download1.png", 0)
_, img2 = cv2.threshold(img2, 127, 255, cv2.THRESH_BINARY)

# Acquire size of the image
p, q = img2.shape

# Show the image
plt.imshow(img2, cmap="gray")

# Define new image to store the pixels of the dilated image
imgDilate = np.zeros((p, q), dtype=np.uint8)

# Define a cross-shaped structuring element
SED = np.array([[0, 1, 0], [1, 1, 1], [0, 1, 0]])
constant1 = 1

# Dilation without using the inbuilt cv2 function:
# each output pixel is the maximum over the neighbourhood selected by the SE
for i in range(constant1, p-constant1):
    for j in range(constant1, q-constant1):
        temp = img2[i-constant1:i+constant1+1, j-constant1:j+constant1+1]
        product = temp*SED
        imgDilate[i, j] = np.max(product)

plt.imshow(imgDilate, cmap="gray")
def erosion(img, SE):
    imgErode = cv2.erode(img, SE, iterations=1)
    return imgErode

def dilation(img, SE):
    imgDilate = cv2.dilate(img, SE, iterations=1)
    return imgDilate

img = cv2.imread("download1.png", 0)
cv2.imwrite("whaat.png", img)
SE = cv2.getStructuringElement(cv2.MORPH_RECT, (3, 3))

# Opening = erosion then dilation; closing = dilation then erosion
AeB = erosion(img, SE)        # E(A,B): eroded image
AoB = dilation(AeB, SE)       # O(A,B): opening
AoBdB = dilation(AoB, SE)     # D(O(A,B),B): opening followed by dilation
AoBdBeB = erosion(AoBdB, SE)  # C(O(A,B),B): closing of the opening

plt.subplot(3, 2, 1)
plt.title("Original")
plt.imshow(img, cmap="gray")
plt.subplot(3, 2, 2)
plt.title("E(A,B)")
plt.imshow(AeB, cmap="gray")
plt.subplot(3, 2, 3)
plt.title("O(A,B)")
plt.imshow(AoB, cmap="gray")
plt.subplot(3, 2, 4)
plt.title("D(O(A,B),B)")
plt.imshow(AoBdB, cmap="gray")
plt.subplot(3, 2, 5)
plt.title("C(O(A,B),B)")
plt.imshow(AoBdBeB, cmap="gray")
Output :
Result :
The above code has been executed and the output has been verified.
Application of Filters on videos
Ex.no : 07
Date : 24/08/2023
Aim :
To Enhance a video using different filters such as blurring filters (box and Gaussian), edge
detection (Canny), and sharpening (unsharp mask) to each frame of the video and then combines
the original and processed frames into a single output video.
Code :
import cv2
import numpy as np
from google.colab.patches import cv2_imshow
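The record loses the setup for the loop below (the apply_filters helper, the capture, and the writer); a minimal sketch consistent with how they are used, with assumed file names input.mp4 and output.mp4:

def apply_filters(frame):
    '''Return box-blurred, Gaussian-blurred, Canny-edge, and unsharp-masked versions of a frame.'''
    box_blurred = cv2.blur(frame, (5, 5))
    gaussian_blurred = cv2.GaussianBlur(frame, (5, 5), 0)
    edges = cv2.Canny(cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY), 100, 200)
    unsharp = cv2.addWeighted(frame, 1.5, gaussian_blurred, -0.5, 0)
    return box_blurred, gaussian_blurred, edges, unsharp

cap = cv2.VideoCapture('input.mp4')
width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = cap.get(cv2.CAP_PROP_FPS)

# The output holds five half-size frames stacked side by side
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter('output.mp4', fourcc, fps, (5 * (width // 2), height // 2))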
while cap.isOpened():
    ret, frame = cap.read()
    if not ret:
        break

    # Process the frame
    box_blurred_frame, gaussian_blurred_frame, edges_frame, unsharp_mask_frame = apply_filters(frame)

    # Resize frames before stacking
    resized_frame = cv2.resize(frame, (width // 2, height // 2))
    resized_box_blurred_frame = cv2.resize(box_blurred_frame, (width // 2, height // 2))
    resized_gaussian_blurred_frame = cv2.resize(gaussian_blurred_frame, (width // 2, height // 2))
    resized_edges_frame = cv2.resize(edges_frame, (width // 2, height // 2))
    resized_unsharp_mask_frame = cv2.resize(unsharp_mask_frame, (width // 2, height // 2))

    # Convert the grayscale edge frame to a three-channel image
    resized_edges_frame = cv2.cvtColor(resized_edges_frame, cv2.COLOR_GRAY2BGR)

    # Stack the resized frames horizontally
    combined_frame = np.hstack((resized_frame, resized_box_blurred_frame,
                                resized_gaussian_blurred_frame, resized_edges_frame,
                                resized_unsharp_mask_frame))

    # Write the combined frame to the output video
    out.write(combined_frame)
    cv2_imshow(combined_frame)

    if cv2.waitKey(1) & 0xFF == ord('q'):
        break

# Release video objects and close windows
cap.release()
out.release()
cv2.destroyAllWindows()
Output :
Result :
The above code has been executed and the output has been verified.
Moving Object Detection
Ex.no : 08
Date : 24/08/2023
Aim :
To implement a pre-trained model to detect moving objects, such as persons or vehicles, in a video.
Code :
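No code survives in the record for this experiment; a minimal sketch using the pre-trained YOLOv8 weights from the Ultralytics package used in Ex. 02 (the video path traffic.mp4 and the class choices are assumptions):

import cv2
from ultralytics import YOLO
from google.colab.patches import cv2_imshow

# Load a model pre-trained on COCO (class 0 = person, class 2 = car)
model = YOLO('yolov8n.pt')

cap = cv2.VideoCapture('traffic.mp4')  # assumed input video
while cap.isOpened():
    ret, frame = cap.read()
    if not ret:
        break
    # Detect only persons (0) and cars (2) in the current frame
    results = model(frame, classes=[0, 2])
    # plot() draws the predicted boxes and labels onto the frame
    annotated = results[0].plot()
    cv2_imshow(annotated)
cap.release()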
Output :
Result :
The above code has been executed and the output has been verified.
Alpha Blending and Masking
Ex.no : 09
Date : 24/08/2023
Aim :
To consider any two images and blend them using alpha blending to create a new image, and to extract regions of an image using masking.
Code :
import cv2
import numpy as np
from google.colab.patches import cv2_imshow
# Load the two images you want to blend
image1 = cv2.imread('cat.jpg')  # replace 'cat.jpg' with the path to your first image
image2 = cv2.imread('dog.jpg')  # replace 'dog.jpg' with the path to your second image

# Resize the images to the same dimensions (addWeighted requires equal shapes)
width = 400   # set your desired width
height = 300  # set your desired height
image1 = cv2.resize(image1, (width, height))
image2 = cv2.resize(image2, (width, height))

# Display the original images
cv2_imshow(image1)
cv2_imshow(image2)
cv2.waitKey(0)
cv2.destroyAllWindows()
# Set the alpha, beta, and gamma values for blending:
# addWeighted computes  blended = alpha*image1 + beta*image2 + gamma
alpha = 0.5  # weight of the first image
beta = 0.5   # weight of the second image
gamma = 0    # scalar added to each pixel

# Blend the images using alpha blending
blended_image = cv2.addWeighted(image1, alpha, image2, beta, gamma)

# Display the blended image
cv2_imshow(blended_image)
cv2.waitKey(0)
cv2.destroyAllWindows()
# Rectangular mask: keep only the pixels inside the white rectangle
image = cv2.imread("cat.jpg")
cv2_imshow(image)
mask = np.zeros(image.shape[:2], dtype="uint8")
cv2.rectangle(mask, (0, 90), (290, 450), 255, -1)
cv2_imshow(mask)
masked = cv2.bitwise_and(image, image, mask=mask)
cv2_imshow(masked)
cv2.waitKey(0)

# Circular mask
mask = np.zeros(image.shape[:2], dtype="uint8")
cv2.circle(mask, (145, 200), 100, 255, -1)
masked = cv2.bitwise_and(image, image, mask=mask)

# Show the output images
cv2_imshow(mask)
cv2_imshow(masked)
cv2.waitKey(0)
from PIL import Image

image = Image.open('dog.jpg').convert('RGBA')
alpha_mask = Image.open('cat.jpg').convert('L')
# Image.ANTIALIAS was removed in Pillow 10; LANCZOS is the equivalent filter
alpha_mask = alpha_mask.resize(image.size, Image.LANCZOS)
image.putalpha(alpha_mask)
image.save('masked_image.png')
Output :
Result :
The above code has been executed and the output has been verified.
Feature Detection (Corner Detection)
Ex.no : 10
Date : 24/08/2023
Aim :
To implement various corner detection algorithms, such as Harris corner, Shi-Tomasi, SIFT, and SURF, on an image to detect its corners.
Code :
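No code survives in the record for this experiment; a minimal sketch of Harris, Shi-Tomasi, and SIFT detection with OpenCV, assuming an image at /content/chess.jpg (SURF is patented and absent from stock OpenCV builds, so it is omitted):

import cv2
import numpy as np
from google.colab.patches import cv2_imshow

img = cv2.imread('/content/chess.jpg')  # assumed path
gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

# Harris corner detection: mark strong corner responses in red
harris = cv2.cornerHarris(np.float32(gray), blockSize=2, ksize=3, k=0.04)
img_harris = img.copy()
img_harris[harris > 0.01 * harris.max()] = [0, 0, 255]
cv2_imshow(img_harris)

# Shi-Tomasi: the N strongest corners via goodFeaturesToTrack
corners = cv2.goodFeaturesToTrack(gray, maxCorners=50, qualityLevel=0.01, minDistance=10)
img_shi = img.copy()
for c in corners:
    x, y = c.ravel().astype(int)
    cv2.circle(img_shi, (x, y), 4, (0, 255, 0), -1)
cv2_imshow(img_shi)

# SIFT keypoints (detects corners and blobs with scale and orientation)
sift = cv2.SIFT_create()
keypoints = sift.detect(gray, None)
img_sift = cv2.drawKeypoints(img, keypoints, None,
                             flags=cv2.DRAW_MATCHES_FLAGS_DRAW_RICH_KEYPOINTS)
cv2_imshow(img_sift)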
Output :
Result :
The above code has been executed and the output has been verified.
Image Matching
Ex.no : 11
Date : 24/08/2023
Aim :
To read an input (query) image and match it against a train (scene) image using brute-force matching with ORB descriptors in OpenCV. The output image displays the top matched keypoints between the two images.
Code :
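Only two lines of this program survive; a minimal sketch of the missing setup, matching the detector and BF_FeatureMatcher names used below (the image paths are assumptions):

import cv2
import numpy as np
from google.colab.patches import cv2_imshow

# Read the query and train images as grayscale ('query.jpg' and 'train.jpg' are assumed paths)
gray_pic1 = cv2.imread('query.jpg', 0)
gray_pic2 = cv2.imread('train.jpg', 0)

def detector(image1, image2):
    '''Detect ORB keypoints and compute descriptors for both images.'''
    orb = cv2.ORB_create()
    kp1, des1 = orb.detectAndCompute(image1, None)
    kp2, des2 = orb.detectAndCompute(image2, None)
    return kp1, des1, kp2, des2

def BF_FeatureMatcher(des1, des2):
    '''Brute-force matching with Hamming distance, the right metric for binary ORB descriptors.'''
    bf = cv2.BFMatcher(cv2.NORM_HAMMING, crossCheck=True)
    matches = bf.match(des1, des2)
    return sorted(matches, key=lambda m: m.distance)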
# Store the detected key points and descriptors of both images
key_pt1, descrip1, key_pt2, descrip2 = detector(gray_pic1, gray_pic2)

# Sort the best matches obtained from the brute-force matcher
number_of_matches = BF_FeatureMatcher(descrip1, descrip2)
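The display step is also missing from the record; a short sketch (the choice of 15 matches is arbitrary):

# Draw the top matched keypoints between the query and train images
output = cv2.drawMatches(gray_pic1, key_pt1, gray_pic2, key_pt2,
                         number_of_matches[:15], None, flags=2)
cv2_imshow(output)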
Output :
Result :
The above code has been executed and the output has been verified.
Hough Transform
Ex.no : 12
Date : 24/08/2023
Aim :
To consider any image, apply the Hough transform to detect shapes in it, and display the output.
Code :
import cv2
import numpy as np
from google.colab.patches import cv2_imshow
img_path="/content/th.jpg"
image=cv2.imread(img_path)
# Convert the image to grayscale
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
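The record stops after the grayscale conversion; a minimal sketch of the Hough line and circle detection the aim asks for (all thresholds are example values):

# Detect edges first; Hough line detection works on an edge map
edges = cv2.Canny(gray, 50, 150)

# Probabilistic Hough transform for line segments
lines = cv2.HoughLinesP(edges, 1, np.pi / 180, threshold=80,
                        minLineLength=30, maxLineGap=10)
if lines is not None:
    for x1, y1, x2, y2 in lines[:, 0]:
        cv2.line(image, (x1, y1), (x2, y2), (0, 255, 0), 2)

# Hough transform for circles
circles = cv2.HoughCircles(gray, cv2.HOUGH_GRADIENT, dp=1, minDist=30,
                           param1=100, param2=40, minRadius=10, maxRadius=100)
if circles is not None:
    for x, y, r in np.uint16(np.around(circles))[0]:
        cv2.circle(image, (x, y), r, (0, 0, 255), 2)

cv2_imshow(image)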
Output :
Result :
The above code has been executed and the output has been verified.
Contour Detection and Drawing
Ex.no : 13
Date : 24/08/2023
Aim :
To detect contours in an image, draw the detected contours on the image, and display the output.
Code :
import cv2
import numpy as np
from google.colab.patches import cv2_imshow # Import cv2_imshow for Google Colab
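Only the imports survive in the record; a minimal sketch of contour detection and drawing, assuming an image at /content/shapes.jpg:

# Read the image and threshold it to binary ('/content/shapes.jpg' is an assumed path)
image = cv2.imread('/content/shapes.jpg')
gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
_, thresh = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)

# Find the contours in the binary image
contours, hierarchy = cv2.findContours(thresh, cv2.RETR_TREE, cv2.CHAIN_APPROX_SIMPLE)
print('Number of contours found:', len(contours))

# Draw all contours (-1) in green on a copy of the image
output = image.copy()
cv2.drawContours(output, contours, -1, (0, 255, 0), 2)
cv2_imshow(output)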
Output :
Result :
The above code has been executed and the output has been verified.
Image segmentation using OpenCV
Ex.no : 14
Date : 24/08/2023
Aim :
To consider an image or a frame from a video, apply thresholding and contour detection, and segment the image.
Code :
import matplotlib.pyplot as plt
import numpy as np
import cv2

sample_image = cv2.imread('image.jpg')
img = cv2.cvtColor(sample_image, cv2.COLOR_BGR2RGB)
img = cv2.resize(img, (256, 256))
plt.axis('off')
plt.imshow(img)

# Threshold the grayscale image to a binary map (the record omits this step)
gray = cv2.cvtColor(img, cv2.COLOR_RGB2GRAY)
_, thresh = cv2.threshold(gray, 127, 255, cv2.THRESH_BINARY)

# Edge detection on the binary map, dilated to close small gaps
edges = cv2.dilate(cv2.Canny(thresh, 0, 255), None)
plt.axis('off')
plt.imshow(edges)
# Keep the largest contour by area and fill it as a mask
cnt = sorted(cv2.findContours(edges, cv2.RETR_LIST, cv2.CHAIN_APPROX_SIMPLE)[-2],
             key=cv2.contourArea)[-1]
mask = np.zeros((256, 256), np.uint8)
masked = cv2.drawContours(mask, [cnt], -1, 255, -1)
plt.axis('off')
plt.imshow(masked)

# Apply the mask: keep only the pixels inside the largest contour
# (img is already RGB, so no further colour conversion is needed)
segmented = cv2.bitwise_and(img, img, mask=mask)
plt.imshow(segmented)
Output :
Result :
The above code has been executed and the output has been verified.