Yolo Detect

This document is a Python script that uses a YOLO model for object detection on images, image folders, video files, USB cameras, or a Picamera. It parses command-line arguments for the model path, source type, confidence threshold, display resolution, and recording options, handles each input source, and displays detection results with labeled bounding boxes. The script also calculates and displays the average frame rate while processing video streams.
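A typical invocation might look like the following (the script filename yolo_detect.py is an assumption, and the argument values are the illustrative ones from the script's own help text):

python yolo_detect.py --model runs/detect/train/weights/best.pt --source usb0 --thresh 0.4 --resolution 640x480 --record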


import os
import sys
import argparse
import glob
import time

import cv2
import numpy as np
from ultralytics import YOLO
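# Note: cv2 (opencv-python), numpy, and ultralytics are third-party packages that
# must be installed separately; picamera2 is imported further down, only when a
# Picamera source is selected.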

# Define and parse user input arguments

parser = argparse.ArgumentParser()
parser.add_argument('--model', help='Path to YOLO model file (example: "runs/detect/train/weights/best.pt")', required=True)
parser.add_argument('--source', help='Image source, can be image file ("test.jpg"), image folder ("test_dir"), video file ("testvid.mp4"), or index of USB camera ("usb0")', required=True)
parser.add_argument('--thresh', help='Minimum confidence threshold for displaying detected objects (example: "0.4")', default=0.5)
parser.add_argument('--resolution', help='Resolution in WxH to display inference results at (example: "640x480"), otherwise match source resolution', default=None)
parser.add_argument('--record', help='Record results from video or webcam and save it as "demo1.avi". Must specify --resolution argument to record.', action='store_true')

args = parser.parse_args()

# Parse user inputs

model_path = args.model
img_source = args.source
min_thresh = float(args.thresh) # Cast to float; argparse returns a string when --thresh is passed on the command line
user_res = args.resolution
record = args.record

# Check if model file exists and is valid

if not os.path.exists(model_path):
    print('ERROR: Model path is invalid or model was not found. Make sure the model filename was entered correctly.')
    sys.exit(0)

# Load the model into memory and get labelmap

model = YOLO(model_path, task='detect')
labels = model.names
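# (model.names is a dictionary mapping integer class IDs to class-name strings)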

# Parse input to determine if image source is a file, folder, video, or USB camera
img_ext_list = ['.jpg','.JPG','.jpeg','.JPEG','.png','.PNG','.bmp','.BMP']
vid_ext_list = ['.avi','.mov','.mp4','.mkv','.wmv']

if os.path.isdir(img_source):
    source_type = 'folder'
elif os.path.isfile(img_source):
    _, ext = os.path.splitext(img_source)
    if ext in img_ext_list:
        source_type = 'image'
    elif ext in vid_ext_list:
        source_type = 'video'
    else:
        print(f'File extension {ext} is not supported.')
        sys.exit(0)
elif 'usb' in img_source:
    source_type = 'usb'
    usb_idx = int(img_source[3:])
elif 'picamera' in img_source:
    source_type = 'picamera'
    picam_idx = int(img_source[8:])
else:
    print(f'Input {img_source} is invalid. Please try again.')
    sys.exit(0)

# Parse user-specified display resolution

resize = False
if user_res:
    resize = True
    resW, resH = int(user_res.split('x')[0]), int(user_res.split('x')[1])

# Check if recording is valid and set up recording

if record:
    if source_type not in ['video','usb']:
        print('Recording only works for video and camera sources. Please try again.')
        sys.exit(0)
    if not user_res:
        print('Please specify resolution to record video at.')
        sys.exit(0)

    # Set up recording
    record_name = 'demo1.avi'
    record_fps = 30
    recorder = cv2.VideoWriter(record_name, cv2.VideoWriter_fourcc(*'MJPG'), record_fps, (resW,resH))

# Load or initialize image source

if source_type == 'image':
    imgs_list = [img_source]
elif source_type == 'folder':
    imgs_list = []
    filelist = glob.glob(img_source + '/*')
    for file in filelist:
        _, file_ext = os.path.splitext(file)
        if file_ext in img_ext_list:
            imgs_list.append(file)
elif source_type == 'video' or source_type == 'usb':
    if source_type == 'video': cap_arg = img_source
    elif source_type == 'usb': cap_arg = usb_idx
    cap = cv2.VideoCapture(cap_arg) # Open the video file or USB camera selected by --source

    # Set camera or video resolution if specified by user
    if user_res:
        ret = cap.set(cv2.CAP_PROP_FRAME_WIDTH, resW)
        ret = cap.set(cv2.CAP_PROP_FRAME_HEIGHT, resH)

elif source_type == 'picamera':
    from picamera2 import Picamera2
    if not user_res: # resW and resH are only defined when --resolution is given
        print('Please specify a resolution with --resolution when using the Picamera source.')
        sys.exit(0)
    cap = Picamera2()
    cap.configure(cap.create_video_configuration(main={"format": 'XRGB8888', "size": (resW, resH)}))
    cap.start()

# Set bounding box colors (using the Tableau 10 color scheme)

bbox_colors = [(164,120,87), (68,148,228), (93,97,209), (178,182,133), (88,159,106),
               (96,202,231), (159,124,168), (169,162,241), (98,118,150), (172,176,184)]

# Initialize control and status variables

avg_frame_rate = 0
frame_rate_buffer = []
fps_avg_len = 200
img_count = 0

# Begin inference loop

while True:

    t_start = time.perf_counter()

    # Load frame from image source
    if source_type == 'image' or source_type == 'folder': # If source is an image or image folder, load the image using its filename
        if img_count >= len(imgs_list):
            print('All images have been processed. Exiting program.')
            sys.exit(0)
        img_filename = imgs_list[img_count]
        frame = cv2.imread(img_filename)
        img_count = img_count + 1

    elif source_type == 'video': # If source is a video, load next frame from video file
        ret, frame = cap.read()
        if not ret:
            print('Reached end of the video file. Exiting program.')
            break

    elif source_type == 'usb': # If source is a USB camera, grab frame from camera
        ret, frame = cap.read()
        if (frame is None) or (not ret):
            print('Unable to read frames from the camera. This indicates the camera is disconnected or not working. Exiting program.')
            break

    elif source_type == 'picamera': # If source is a Picamera, grab frame using the picamera interface
        frame_bgra = cap.capture_array()
        frame = cv2.cvtColor(np.copy(frame_bgra), cv2.COLOR_BGRA2BGR)
        if frame is None:
            print('Unable to read frames from the Picamera. This indicates the camera is disconnected or not working. Exiting program.')
            break

    # Resize frame to desired display resolution
    if resize:
        frame = cv2.resize(frame,(resW,resH))

    # Run inference on frame
    results = model(frame, verbose=False)

    # Extract results
    detections = results[0].boxes

    # Initialize variable for basic object counting example
    object_count = 0

    # Go through each detection and get bbox coords, confidence, and class
    for i in range(len(detections)):

        # Get bounding box coordinates
        # Ultralytics returns results in Tensor format, which have to be converted to a regular Python array
        xyxy_tensor = detections[i].xyxy.cpu() # Detections in Tensor format in CPU memory
        xyxy = xyxy_tensor.numpy().squeeze() # Convert tensors to Numpy array
        xmin, ymin, xmax, ymax = xyxy.astype(int) # Extract individual coordinates and convert to int

        # Get bounding box class ID and name
        classidx = int(detections[i].cls.item())
        classname = labels[classidx]

        # Get bounding box confidence
        conf = detections[i].conf.item()

        # Draw box if confidence threshold is high enough (use the user-specified --thresh value)
        if conf > min_thresh:

            color = bbox_colors[classidx % 10]
            cv2.rectangle(frame, (xmin,ymin), (xmax,ymax), color, 2)

            label = f'{classname}: {int(conf*100)}%'
            labelSize, baseLine = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.5, 1) # Get font size
            label_ymin = max(ymin, labelSize[1] + 10) # Make sure not to draw label too close to top of window
            cv2.rectangle(frame, (xmin, label_ymin-labelSize[1]-10), (xmin+labelSize[0], label_ymin+baseLine-10), color, cv2.FILLED) # Draw filled box to put label text in
            cv2.putText(frame, label, (xmin, label_ymin-7), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1) # Draw label text

            # Basic example: count the number of objects in the image
            object_count = object_count + 1

    # Calculate and draw framerate (if using video, USB, or Picamera source)
    if source_type == 'video' or source_type == 'usb' or source_type == 'picamera':
        cv2.putText(frame, f'FPS: {avg_frame_rate:0.2f}', (10,20), cv2.FONT_HERSHEY_SIMPLEX, .7, (0,255,255), 2) # Draw framerate

    # Display detection results
    cv2.putText(frame, f'Number of objects: {object_count}', (10,40), cv2.FONT_HERSHEY_SIMPLEX, .7, (0,255,255), 2) # Draw total number of detected objects
    cv2.imshow('YOLO detection results',frame) # Display image
    if record: recorder.write(frame)

    # If inferencing on individual images, wait for user keypress before moving to next image.
    # Otherwise, wait 5ms before moving to next frame.
    if source_type == 'image' or source_type == 'folder':
        key = cv2.waitKey()
    elif source_type == 'video' or source_type == 'usb' or source_type == 'picamera':
        key = cv2.waitKey(5)

    if key == ord('q') or key == ord('Q'): # Press 'q' to quit
        break
    elif key == ord('s') or key == ord('S'): # Press 's' to pause inference
        cv2.waitKey()
    elif key == ord('p') or key == ord('P'): # Press 'p' to save a picture of results on this frame
        cv2.imwrite('capture.png',frame)

    # Calculate FPS for this frame
    t_stop = time.perf_counter()
    frame_rate_calc = float(1/(t_stop - t_start))

    # Append FPS result to frame_rate_buffer (for finding average FPS over multiple frames)
    if len(frame_rate_buffer) >= fps_avg_len:
        frame_rate_buffer.pop(0) # Drop the oldest entry so the buffer stays at fps_avg_len frames
        frame_rate_buffer.append(frame_rate_calc)
    else:
        frame_rate_buffer.append(frame_rate_calc)

    # Calculate average FPS for past frames
    avg_frame_rate = np.mean(frame_rate_buffer)

# Clean up
print(f'Average pipeline FPS: {avg_frame_rate:.2f}')
if source_type == 'video' or source_type == 'usb':
    cap.release()
elif source_type == 'picamera':
    cap.stop()
if record: recorder.release()
cv2.destroyAllWindows()
