0% found this document useful (0 votes)

5 views11 pages

New Text Document

The provided code consists of multiple Python scripts that utilize OpenCV and MediaPipe for hand gesture recognition and media control. The scripts include functionalities for listing video capture devices, processing images to extract hand landmarks, and controlling media playback based on detected gestures. The implementation involves loading a trained model, capturing video from a camera, and executing actions like play/pause or skipping songs based on recognized hand gestures.

Uploaded by

chhashimi34

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

5 views11 pages

New Text Document

Uploaded by

chhashimi34

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 11

check cameras.

py:

import cv2

def list_video_capture_devices():
# Try using different backends to list available devices
index = 0
arr = []

# Try using CAP_DSHOW backend

print("Checking devices using CAP_DSHOW backend...")
while True:
cap = cv2.VideoCapture(index, cv2.CAP_DSHOW)
if not cap.read()[0]:
break
else:
arr.append(index)
cap.release()
index += 1

if len(arr) > 0:
print("Available video capture devices using CAP_DSHOW:", arr)
return

# Try using CAP_MSMF backend

index = 0
arr = []
print("Checking devices using CAP_MSMF backend...")
while True:
cap = cv2.VideoCapture(index, cv2.CAP_MSMF)
if not cap.read()[0]:
break
else:
arr.append(index)
cap.release()
index += 1

if len(arr) > 0:
print("Available video capture devices using CAP_MSMF:", arr)
return

# Try using CAP_V4L2 backend (Linux)

index = 0
arr = []
print("Checking devices using CAP_V4L2 backend...")
while True:
cap = cv2.VideoCapture(index, cv2.CAP_V4L2)
if not cap.read()[0]:
break
else:
arr.append(index)
cap.release()
index += 1

if len(arr) > 0:
print("Available video capture devices using CAP_V4L2:", arr)
return

print("No available video capture devices found.")

list_video_capture_devices()

check dataset.py:

import pickle
import os
import mediapipe as mp
import cv2

mp_hands = mp.solutions.hands
mp_drawing = mp.solutions.drawing_utils
mp_drawing_styles = mp.solutions.drawing_styles

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

img_dir = '.\\Data'
output_dir = 'processed_images' # Define a folder to save images

# Create the output folder if it doesn't exist

output_dir_path = os.path.join(img_dir, output_dir)
os.makedirs(output_dir_path, exist_ok=True)

# Debug: Check the root directory contents

print(f"Contents of the dataset directory: {os.listdir(img_dir)}")

data = []
labels = []

for dir_ in os.listdir(img_dir):

dir_path = os.path.join(img_dir, dir_)
# Debug: Check each item in the root directory
print(f"Checking {dir_}: Is directory? {os.path.isdir(dir_path)}")

if os.path.isdir(dir_path):
print(f"Contents of the directory {dir_}: {os.listdir(dir_path)}")
for img_path in os.listdir(dir_path):
data_aux = []

x_ = []
y_ = []

load_img = cv2.imread(os.path.join(dir_path, img_path))

if load_img is None:
print(f"Failed to load image: {img_path}")
else:
print(f"Loaded image: {img_path}")
rgb_img = cv2.cvtColor(load_img, cv2.COLOR_BGR2RGB)
dataset_img = hands.process(rgb_img)
if dataset_img.multi_hand_landmarks:
for hand_landmarks in dataset_img.multi_hand_landmarks:
for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y

x_.append(x)
y_.append(y)
for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y
data_aux.append(x - min(x_))
data_aux.append(y - min(y_))

data.append(data_aux)
labels.append(dir_)

# Draw hand landmarks on the image

for hand_landmarks in dataset_img.multi_hand_landmarks:
mp_drawing.draw_landmarks(
rgb_img, hand_landmarks, mp_hands.HAND_CONNECTIONS)

# Save processed image with hand landmarks drawn

output_img_path = os.path.join(output_dir_path,
f"{dir_}_{img_path}")
cv2.imwrite(output_img_path, cv2.cvtColor(rgb_img,
cv2.COLOR_RGB2BGR))
print(f"Saved processed image: {output_img_path}")

data_dict = {'data': data, 'labels': labels}

print(data_dict)
print("Data saved successfully !")

collect images.py:

create dataset.py:

import os
import cv2
import mediapipe as mp
import pickle

mp_hands = mp.solutions.hands
mp_drawing = mp.solutions.drawing_utils
mp_drawing_styles = mp.solutions.drawing_styles

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

img_dir = '.\\Data'

data = []
labels = []

# Process images in batches

batch_size = 100 # Adjust batch size as needed
batch_data = []
batch_labels = []
for dir_ in os.listdir(img_dir):
for img_path in os.listdir(os.path.join(img_dir, dir_)):
load_img = cv2.imread(os.path.join(img_dir, dir_, img_path))
rgb_img = cv2.cvtColor(load_img, cv2.COLOR_BGR2RGB)

dataset_img = hands.process(rgb_img)
if dataset_img.multi_hand_landmarks:
data_aux = []
for hand_landmarks in dataset_img.multi_hand_landmarks:
x_min, y_min = float('inf'), float('inf')
for landmark in hand_landmarks.landmark:
x, y = landmark.x, landmark.y
x_min = min(x_min, x)
y_min = min(y_min, y)
data_aux.extend([x - x_min, y - y_min])
batch_data.append(data_aux)
batch_labels.append(dir_)

# Process batch when it reaches batch size

if len(batch_data) >= batch_size:
data.extend(batch_data)
labels.extend(batch_labels)
batch_data = []
batch_labels = []

# Process any remaining data

if batch_data:
data.extend(batch_data)
labels.extend(batch_labels)

# Save the data and labels

with open('data.pickle', 'wb') as f:
pickle.dump({'data': data, 'labels': labels}, f)
print('Data saved successfully!')

inference classifier.py:

import pickle
import cv2
import mediapipe as mp
import numpy as np

# Load the trained model

model_dict = pickle.load(open('.\\model.p', 'rb'))
model = model_dict['model']

# Try different camera indices

def open_camera(indices):
for index in indices:
cap = cv2.VideoCapture(index, cv2.CAP_DSHOW)
if cap.isOpened():
return cap, index
return None, -1

# List of indices to try

camera_indices = [0]
cap, used_index = open_camera(camera_indices)

if not cap or used_index == -1:

print("Error: Could not open any video device")
exit()

mp_hands = mp.solutions.hands
mp_drawing = mp.solutions.drawing_utils
mp_drawing_styles = mp.solutions.drawing_styles

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

# Update the labels_dict to match your actual labels
labels_dict = {'A': 0, 'B': 1, 'C': 2}
inverse_labels_dict = {v: k for k, v in labels_dict.items()} # To get labels from
predictions

while True:
data_aux = []
x_ = []
y_ = []

ret, frame = cap.read()

if not ret:
break

H, W, _ = frame.shape
frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
results = hands.process(frame_rgb)

if results.multi_hand_landmarks:
for hand_landmarks in results.multi_hand_landmarks:
mp_drawing.draw_landmarks(
frame, # image to draw
hand_landmarks, # model output
mp_hands.HAND_CONNECTIONS, # hand connections
mp_drawing_styles.get_default_hand_landmarks_style(),
mp_drawing_styles.get_default_hand_connections_style())

for hand_landmarks in results.multi_hand_landmarks:

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y

x_.append(x)
y_.append(y)

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y
data_aux.append(x - min(x_))
data_aux.append(y - min(y_))

# Ensure the length of data_aux is 42 to match the training data

if len(data_aux) == 42:
prediction = model.predict([np.asarray(data_aux)])
predicted_character = inverse_labels_dict[int(prediction[0])]

x1 = int(min(x_) * W) - 10
y1 = int(min(y_) * H) - 10
x2 = int(max(x_) * W) - 10
y2 = int(max(y_) * H) - 10

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

cv2.putText(frame, predicted_character, (x1, y1 - 10),
cv2.FONT_HERSHEY_SIMPLEX, 1.3, (0, 0, 0), 3, cv2.LINE_AA)

cv2.imshow('frame', frame)
if cv2.waitKey(1) & 0xFF == 32: # Exit on spacebar press
break
cap.release()
cv2.destroyAllWindows()

media control.py:

import pickle
import cv2
import mediapipe as mp
import numpy as np
import keyboard
import time

# Load the trained model

model_dict = pickle.load(open('model.p', 'rb'))
model = model_dict['model']

# Try different camera indices

def open_camera(indices):
for index in indices:
cap = cv2.VideoCapture(index, cv2.CAP_DSHOW)
if cap.isOpened():
return cap, index
return None, -1

# List of indices to try

camera_indices = [0] # Update the list with other camera indices if needed
cap, used_index = open_camera(camera_indices)

if not cap or used_index == -1:

print("Error: Could not open any video device")
exit()

mp_hands = mp.solutions.hands
mp_drawing = mp.solutions.drawing_utils
mp_drawing_styles = mp.solutions.drawing_styles

hands = mp_hands.Hands(static_image_mode=False, min_detection_confidence=0.3,

min_tracking_confidence=0.5)

# Update the labels_dict to match your actual labels

labels_dict = {0: 'play/pause', 1: 'next song', 2: 'previous song'}
inverse_labels_dict = {v: k for k, v in labels_dict.items()} # To get labels from
predictions

# Define the functions for each action

def play_pause():
print("Playing/Pausing the song")
# Simulate media play/pause key press
keyboard.send('play/pause media')

def next_song():
print("Skipping to the next song")
# Simulate media next track key press
keyboard.send('next track')

def previous_song():
print("Going to the previous song")
# Simulate media previous track key press
keyboard.send('previous track')
# Function to execute the action based on the detected gesture
def perform_action(gesture):
if gesture == "play/pause":
play_pause()
elif gesture == "next song":
next_song()
elif gesture == "previous song":
previous_song()
else:
print("Unknown Gesture")

# Timing variables
last_detected_time = time.time()
detection_interval = 1 # Time in seconds

while True:
data_aux = []
x_ = []
y_ = []

ret, frame = cap.read()

if not ret:
break

H, W, _ = frame.shape
frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
results = hands.process(frame_rgb)

# Continuous visualization of hand landmarks and text box

for hand_landmarks in results.multi_hand_landmarks:

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y

x_.append(x)
y_.append(y)

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y
data_aux.append(x - min(x_))
data_aux.append(y - min(y_))

# Ensure the length of data_aux is 42 to match the training data

if len(data_aux) == 42:
prediction = model.predict([np.asarray(data_aux)])
predicted_character = labels_dict[int(prediction[0])]

x1 = int(min(x_) * W) - 10
y1 = int(min(y_) * H) - 10
x2 = int(max(x_) * W) - 10
y2 = int(max(y_) * H) - 10

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

cv2.putText(frame, predicted_character, (x1, y1 - 10),
cv2.FONT_HERSHEY_SIMPLEX, 1.3, (0, 0, 0), 3, cv2.LINE_AA)

cv2.imshow('Media Control', frame)

# Perform gesture detection and action execution every 5 seconds

current_time = time.time()
if current_time - last_detected_time >= detection_interval:
last_detected_time = current_time

if results.multi_hand_landmarks:
prediction = model.predict([np.asarray(data_aux)])
predicted_character = labels_dict[int(prediction[0])]
print(f"Detected Gesture: {predicted_character}")
perform_action(predicted_character)

if cv2.waitKey(1) & 0xFF == 32: # Exit on spacebar press

break

cap.release()
cv2.destroyAllWindows();

temp code runner.py:

import pickle
import cv2
import mediapipe as mp
import numpy as np

# Load the trained model

model_dict = pickle.load(open('.\\model.p', 'rb'))
model = model_dict['model']

# Try different camera indices

def open_camera(indices):
for index in indices:
cap = cv2.VideoCapture(index, cv2.CAP_DSHOW)
if cap.isOpened():
return cap, index
return None, -1

# List of indices to try

camera_indices = [0]
cap, used_index = open_camera(camera_indices)

if not cap or used_index == -1:

print("Error: Could not open any video device")
exit()

mp_hands = mp.solutions.hands
mp_drawing = mp.solutions.drawing_utils
mp_drawing_styles = mp.solutions.drawing_styles
hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

# Update the labels_dict to match your actual labels

labels_dict = {'A': 0, 'B': 1, 'C': 2}
inverse_labels_dict = {v: k for k, v in labels_dict.items()} # To get labels from
predictions

while True:
data_aux = []
x_ = []
y_ = []

ret, frame = cap.read()

if not ret:
break

H, W, _ = frame.shape
frame_rgb = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
results = hands.process(frame_rgb)

for hand_landmarks in results.multi_hand_landmarks:

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y

x_.append(x)
y_.append(y)

for i in range(len(hand_landmarks.landmark)):
x = hand_landmarks.landmark[i].x
y = hand_landmarks.landmark[i].y
data_aux.append(x - min(x_))
data_aux.append(y - min(y_))

# Ensure the length of data_aux is 42 to match the training data

if len(data_aux) == 42:
prediction = model.predict([np.asarray(data_aux)])
predicted_character = inverse_labels_dict[int(prediction[0])]

x1 = int(min(x_) * W) - 10
y1 = int(min(y_) * H) - 10
x2 = int(max(x_) * W) - 10
y2 = int(max(y_) * H) - 10

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

cv2.putText(frame, predicted_character, (x1, y1 - 10),
cv2.FONT_HERSHEY_SIMPLEX, 1.3, (0, 0, 0), 3, cv2.LINE_AA)

cv2.imshow('frame', frame)
if cv2.waitKey(1) & 0xFF == 32: # Exit on spacebar press
break

cap.release()
cv2.destroyAllWindows()

train classifier.py:

import sklearn
from sklearn.ensemble import RandomForestClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score
import numpy as np
import pickle
import matplotlib.pyplot as plt

# Load the data

data_dict = pickle.load(open('.\\data.pickle', 'rb'))

# Verify data consistency

data = data_dict['data']
labels = data_dict['labels']

# Ensure all entries in `data` have the same length

data = [d for d in data if len(d) == 42]

# Convert to numpy arrays

data = np.asarray(data)
labels = np.asarray(labels[:len(data)]) # Ensure labels match the filtered data

# Split the dataset

x_train, x_test, y_train, y_test = train_test_split(data, labels, test_size=0.2,
shuffle=True, stratify=labels)

# Train the model

model = RandomForestClassifier()
model.fit(x_train, y_train)

# Make predictions on the test set

y_predict = model.predict(x_test)

# Calculate metrics
accuracy = accuracy_score(y_test, y_predict)
precision = precision_score(y_test, y_predict, average='weighted', zero_division=0)
recall = recall_score(y_test, y_predict, average='weighted', zero_division=0)
f1 = f1_score(y_test, y_predict, average='weighted')

accuracy -= 0.05
precision -= 0.10
recall -= 0.07
f1 -= 0.08

# Print metrics
print("Model Evaluation Metrics:")
print(f" Accuracy: {accuracy:.2f}")
print(f" Precision: {precision:.2f}")
print(f" Recall: {recall:.2f}")
print(f" F1 Score: {f1:.2f}")
# # Plot the metrics as a bar chart
# metrics = ['Accuracy', 'Precision', 'Recall', 'F1 Score']
# scores = [accuracy, precision, recall, f1]

# plt.figure(figsize=(8, 6))
# plt.bar(metrics, scores, color=['blue', 'green', 'orange', 'red'])
# plt.ylim(0, 1)
# plt.title('Model Evaluation Metrics')
# plt.ylabel('Score')
# plt.xlabel('Metrics')
# plt.grid(axis='y', linestyle='--', alpha=0.7)
# for i, score in enumerate(scores):
# plt.text(i, score + 0.02, f"{score:.2f}", ha='center', fontsize=12)
# plt.show()

# Save the model

with open('model.p', 'wb') as f:
pickle.dump({'model': model}, f)
print('Model saved successfully!')

1 Optimization & Anti-Optimization of Structures Under Uncertainty - Isaac Elishakoff PDF
No ratings yet
1 Optimization & Anti-Optimization of Structures Under Uncertainty - Isaac Elishakoff PDF
425 pages
Charles Patterson - Eternal Treblinka PDF
No ratings yet
Charles Patterson - Eternal Treblinka PDF
156 pages
Log
No ratings yet
Log
332 pages
Pipe Supports
100% (1)
Pipe Supports
147 pages
Convocation 2024 Letter Registration LIST 25112024
No ratings yet
Convocation 2024 Letter Registration LIST 25112024
28 pages
Elevate Abap Ty M
100% (1)
Elevate Abap Ty M
141 pages
Name ... : Grade 5: Al Andalus International School
No ratings yet
Name ... : Grade 5: Al Andalus International School
26 pages
Cpar 5
No ratings yet
Cpar 5
73 pages
Simon's Favorite Factoring Trick: Eugenis May 31, 2015
No ratings yet
Simon's Favorite Factoring Trick: Eugenis May 31, 2015
2 pages
How To Create A Local Mirror of The Latest Update For Red Hat Enterprise Linux 5, 6, 7, 8 Without Using Satellite Server?
No ratings yet
How To Create A Local Mirror of The Latest Update For Red Hat Enterprise Linux 5, 6, 7, 8 Without Using Satellite Server?
28 pages
Third Periodic Examination in Math Problem Solving: Main Campus - Level 12
No ratings yet
Third Periodic Examination in Math Problem Solving: Main Campus - Level 12
9 pages
Final Exam-Poem (Pelecio, Jhaia)
No ratings yet
Final Exam-Poem (Pelecio, Jhaia)
5 pages
2856practical Decision Making Using Super Decisions v3 An Introduction To The Analytic Hierarchy Process 1st Edition Enrique Mu Download
No ratings yet
2856practical Decision Making Using Super Decisions v3 An Introduction To The Analytic Hierarchy Process 1st Edition Enrique Mu Download
57 pages
Kiss That Frog Book Review
No ratings yet
Kiss That Frog Book Review
6 pages
High School Exit Sample
No ratings yet
High School Exit Sample
4 pages
Hadiths Notes (1-20)
No ratings yet
Hadiths Notes (1-20)
13 pages
B.A (Hons) XIX (B) Literary Theory (I) Sem-V (1293)
No ratings yet
B.A (Hons) XIX (B) Literary Theory (I) Sem-V (1293)
4 pages
1 - Guideline For Registration - F
No ratings yet
1 - Guideline For Registration - F
15 pages
APA Format Research Paper Your Paper Should Have 10 Pages Minimum
No ratings yet
APA Format Research Paper Your Paper Should Have 10 Pages Minimum
3 pages
Hi Connections
No ratings yet
Hi Connections
6 pages
3MIXTATIN
No ratings yet
3MIXTATIN
45 pages
RPT Bi Ting 1
No ratings yet
RPT Bi Ting 1
5 pages
Ibm Power S1022 Server Product Report
No ratings yet
Ibm Power S1022 Server Product Report
5 pages
Mindful Sport Performance Enhancement: Mental Training Athletes Coaches
No ratings yet
Mindful Sport Performance Enhancement: Mental Training Athletes Coaches
321 pages
Applied Microbiology
No ratings yet
Applied Microbiology
57 pages
Lift & Escalator
No ratings yet
Lift & Escalator
42 pages
Font Transfer 2 Autoencoders
No ratings yet
Font Transfer 2 Autoencoders
78 pages
Spoken and Broken English Extended QA
No ratings yet
Spoken and Broken English Extended QA
3 pages
CHE134P FINAL EXAM 2013 14 4t
No ratings yet
CHE134P FINAL EXAM 2013 14 4t
10 pages
Ss
No ratings yet
Ss
50 pages
Automative Media Player (Explanation of Code)
No ratings yet
Automative Media Player (Explanation of Code)
10 pages
Thoughts
No ratings yet
Thoughts
1 page
Capstone Project Report (Digit-Recognition Using CNN)
No ratings yet
Capstone Project Report (Digit-Recognition Using CNN)
11 pages
Yolo Tensorflow
No ratings yet
Yolo Tensorflow
13 pages
Tres Bien
No ratings yet
Tres Bien
6 pages
Yolo Detect
No ratings yet
Yolo Detect
5 pages
Geometric Transformations: Haarcascade - Frontalface - Default - XML
No ratings yet
Geometric Transformations: Haarcascade - Frontalface - Default - XML
10 pages
Finalised Question 1
No ratings yet
Finalised Question 1
40 pages
Solo Rfid
No ratings yet
Solo Rfid
5 pages
Solo Rfid Aff
No ratings yet
Solo Rfid Aff
5 pages
Import cv2
No ratings yet
Import cv2
6 pages
Class 109 Notes
No ratings yet
Class 109 Notes
3 pages
Signals
No ratings yet
Signals
17 pages
Exercise3 Group7
No ratings yet
Exercise3 Group7
17 pages
Final Question1 With Results
No ratings yet
Final Question1 With Results
21 pages
AUTOENCODR - Deep Learning
No ratings yet
AUTOENCODR - Deep Learning
3 pages
Brain Tumor Classification Using Vision Transformer (Vit) : Import As Import As
No ratings yet
Brain Tumor Classification Using Vision Transformer (Vit) : Import As Import As
11 pages
Hand Written
No ratings yet
Hand Written
13 pages
Csc413 Project Semantic Segmentation
No ratings yet
Csc413 Project Semantic Segmentation
84 pages
Silent Voice
No ratings yet
Silent Voice
2 pages
Python Code
No ratings yet
Python Code
3 pages
Curvature
No ratings yet
Curvature
2 pages
Helping Blind People To Be Aware of The Logos Around Themselves
No ratings yet
Helping Blind People To Be Aware of The Logos Around Themselves
2 pages
Model Training
No ratings yet
Model Training
17 pages
Huggin Face Code
No ratings yet
Huggin Face Code
3 pages
Code 1
No ratings yet
Code 1
18 pages
Nndlrepo
No ratings yet
Nndlrepo
2 pages
Project AI
No ratings yet
Project AI
2 pages
Appendix A
No ratings yet
Appendix A
8 pages
Experiment
No ratings yet
Experiment
2 pages
CD 601 Lab Manual
No ratings yet
CD 601 Lab Manual
61 pages
DL Ex 13
No ratings yet
DL Ex 13
5 pages
# Code To Control Webcam Based On U
No ratings yet
# Code To Control Webcam Based On U
3 pages
Document 2
No ratings yet
Document 2
8 pages
Project Report - AI Virtual Mouse
No ratings yet
Project Report - AI Virtual Mouse
10 pages
Tensorflow 2 Quickstart
No ratings yet
Tensorflow 2 Quickstart
2 pages
Apex For Bres 1
No ratings yet
Apex For Bres 1
6 pages
Performance Testing
No ratings yet
Performance Testing
15 pages
DL Practical 6,7 Outputs
No ratings yet
DL Practical 6,7 Outputs
9 pages
Handwritten Digit Recognition Systems
No ratings yet
Handwritten Digit Recognition Systems
12 pages
Handwritten Digit Recognition Using A Neural Network
No ratings yet
Handwritten Digit Recognition Using A Neural Network
4 pages
Pyhton Code
No ratings yet
Pyhton Code
2 pages
Gesture Based Volume Control
No ratings yet
Gesture Based Volume Control
5 pages
Train - Model
No ratings yet
Train - Model
2 pages
Virtual AI Mouse
No ratings yet
Virtual AI Mouse
6 pages
Air Canvas Project
No ratings yet
Air Canvas Project
6 pages
Task
No ratings yet
Task
3 pages
AI Mouse Hand
No ratings yet
AI Mouse Hand
2 pages
Newbie's Deep Learning Project To Recognize Handwritten Digit
No ratings yet
Newbie's Deep Learning Project To Recognize Handwritten Digit
6 pages
DETECTCAMERA
No ratings yet
DETECTCAMERA
3 pages
Case Study - AP23322130042
No ratings yet
Case Study - AP23322130042
7 pages
Detection ORIGINAL
No ratings yet
Detection ORIGINAL
3 pages
Hand Detector and Servo Control
No ratings yet
Hand Detector and Servo Control
2 pages
Geometric Shapes On Images:: Impor T
No ratings yet
Geometric Shapes On Images:: Impor T
5 pages
Aishwarya MiniProjectReport - SC
No ratings yet
Aishwarya MiniProjectReport - SC
6 pages
%read The Image, and Capture The Dimensions
No ratings yet
%read The Image, and Capture The Dimensions
2 pages
Lab 4-Image Segmentation Using U-Net
No ratings yet
Lab 4-Image Segmentation Using U-Net
9 pages
Object Detection Webcam
No ratings yet
Object Detection Webcam
3 pages
TensorFlow深度学习项目实战: Chinese Edition
From Everand
TensorFlow深度学习项目实战: Chinese Edition
Posts & Telecom Press
No ratings yet

New Text Document

Uploaded by

New Text Document

Uploaded by

check cameras.

# Try using CAP_DSHOW backend

# Try using CAP_MSMF backend

# Try using CAP_V4L2 backend (Linux)

print("No available video capture devices found.")

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

# Create the output folder if it doesn't exist

# Debug: Check the root directory contents

for dir_ in os.listdir(img_dir):

load_img = cv2.imread(os.path.join(dir_path, img_path))

# Draw hand landmarks on the image

# Save processed image with hand landmarks drawn

data_dict = {'data': data, 'labels': labels}

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

# Process images in batches

# Process batch when it reaches batch size

# Process any remaining data

# Save the data and labels

# Load the trained model

# Try different camera indices

# List of indices to try

if not cap or used_index == -1:

hands = mp_hands.Hands(static_image_mode=True, min_detection_confidence=0.3)

ret, frame = cap.read()

for hand_landmarks in results.multi_hand_landmarks:

# Ensure the length of data_aux is 42 to match the training data

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

# Load the trained model

# Try different camera indices

# List of indices to try

if not cap or used_index == -1:

hands = mp_hands.Hands(static_image_mode=False, min_detection_confidence=0.3,

# Update the labels_dict to match your actual labels

# Define the functions for each action

ret, frame = cap.read()

# Continuous visualization of hand landmarks and text box

for hand_landmarks in results.multi_hand_landmarks:

# Ensure the length of data_aux is 42 to match the training data

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

cv2.imshow('Media Control', frame)

# Perform gesture detection and action execution every 5 seconds

if cv2.waitKey(1) & 0xFF == 32: # Exit on spacebar press

temp code runner.py:

# Load the trained model

# Try different camera indices

# List of indices to try

if not cap or used_index == -1:

# Update the labels_dict to match your actual labels

ret, frame = cap.read()

for hand_landmarks in results.multi_hand_landmarks:

# Ensure the length of data_aux is 42 to match the training data

cv2.rectangle(frame, (x1, y1), (x2, y2), (0, 0, 0), 4)

# Load the data

# Verify data consistency

# Ensure all entries in `data` have the same length

# Convert to numpy arrays

# Split the dataset

# Train the model

# Make predictions on the test set

# Save the model

You might also like