Ass 8

The document loads and preprocesses a speech commands dataset to extract MFCC features, splits the data into train, validation and test sets, defines an LSTM model, trains and evaluates the model, and provides a function to make predictions on new audio samples.

Uploaded by

Taqwa Elsayed

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

33 views · 2 pages

Ass 8

Uploaded by

Taqwa Elsayed

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/2

import os

import numpy as np
import tensorflow as tf
from tensorflow.keras import layers, Model
from sklearn.model_selection import train_test_split
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.losses import SparseCategoricalCrossentropy

# Download and unzip the dataset

!wget
https://storage.googleapis.com/download.tensorflow.org/data/mini_speech_commands.zi
p
!unzip mini_speech_commands.zip

# Define constants
DATA_DIR = "mini_speech_commands"
# Only sub-directories are class labels: the archive also contains plain files
# (e.g. a README), and "_background_noise_" (when present) holds noise clips
# rather than a spoken command. Sorting keeps the label -> index mapping
# reproducible, because os.listdir() returns entries in arbitrary order.
LABELS = np.array(
    sorted(
        name
        for name in os.listdir(DATA_DIR)
        if os.path.isdir(os.path.join(DATA_DIR, name))
        and name != "_background_noise_"
    )
)
NUM_CLASSES = len(LABELS)  # size of the model's output layer
SAMPLE_RATE = 16000  # audio sample rate in Hz
MFCC_MAX_LEN = 40  # number of MFCC coefficients kept per frame
BATCH_SIZE = 32  # mini-batch size passed to model.fit
EPOCHS = 10  # number of training epochs passed to model.fit
VAL_SPLIT = 0.2  # fraction of the training data reserved for validation

# Function to load and preprocess audio files

def _waveform_to_mfcc(waveform):
    """Turn a 1-D float waveform into an MFCC matrix of shape (frames, MFCC_MAX_LEN)."""
    # Clips differ slightly in length; trim / zero-pad to exactly one second
    # so every example yields the same number of frames and can be stacked.
    waveform = waveform[:SAMPLE_RATE]
    waveform = tf.pad(waveform, [[0, SAMPLE_RATE - tf.shape(waveform)[0]]])

    # 25 ms windows with a 10 ms hop at 16 kHz.
    stft = tf.signal.stft(
        waveform, frame_length=400, frame_step=160, fft_length=512
    )
    spectrogram = tf.abs(stft)

    # mfccs_from_log_mel_spectrograms expects *log-mel* input, so warp the
    # linear spectrogram onto the mel scale and take the log first.
    mel_matrix = tf.signal.linear_to_mel_weight_matrix(
        num_mel_bins=80,
        num_spectrogram_bins=spectrogram.shape[-1],
        sample_rate=SAMPLE_RATE,
        lower_edge_hertz=80.0,
        upper_edge_hertz=7600.0,
    )
    log_mel = tf.math.log(tf.tensordot(spectrogram, mel_matrix, 1) + 1e-6)

    # The function returns one coefficient per mel bin; keep the first
    # MFCC_MAX_LEN of them.
    return tf.signal.mfccs_from_log_mel_spectrograms(log_mel)[..., :MFCC_MAX_LEN]


def preprocess_data():
    """Load every WAV clip under DATA_DIR and extract its MFCC features.

    Walks one sub-directory per entry in LABELS, skipping
    "_background_noise_" and anything that is not a directory.

    Returns:
        A tuple ``(mfccs, labels)`` of NumPy arrays: ``mfccs`` stacks one
        (frames, MFCC_MAX_LEN) matrix per clip, ``labels`` holds the
        matching directory name for each clip.
    """
    mfccs = []
    labels = []
    for label in LABELS:
        label_dir = os.path.join(DATA_DIR, label)
        # Plain files sitting next to the class folders are not labels.
        if label == "_background_noise_" or not os.path.isdir(label_dir):
            continue
        # Sorted so the example order (and therefore the seeded split)
        # does not depend on filesystem listing order.
        for filename in sorted(os.listdir(label_dir)):
            if not filename.lower().endswith(".wav"):
                continue
            filepath = os.path.join(label_dir, filename)
            audio, _ = tf.audio.decode_wav(
                tf.io.read_file(filepath), desired_channels=1
            )
            # decode_wav yields (samples, channels); drop the channel axis.
            audio = tf.squeeze(audio, axis=-1)
            mfccs.append(_waveform_to_mfcc(audio).numpy())
            labels.append(label)
    return np.array(mfccs), np.array(labels)

# Load and preprocess the data

mfccs, labels = preprocess_data()

# Convert labels to indices (position of each label within LABELS)

label_to_index = {label: i for i, label in enumerate(LABELS)}
indices = np.array([label_to_index[label] for label in labels])

# Split the dataset into train, validation, and test sets.
# 20% is held out for testing; VAL_SPLIT of what remains becomes the
# validation set. A fixed random_state keeps both splits reproducible.

X_train, X_test, y_train, y_test = train_test_split(
    mfccs, indices, test_size=0.2, random_state=42
)
X_train, X_val, y_train, y_val = train_test_split(
    X_train, y_train, test_size=VAL_SPLIT, random_state=42
)

# Define LSTM model

class LSTMModel(Model):
    """Sequence classifier: a single LSTM layer followed by a softmax layer.

    Args:
        num_classes: number of units in the softmax output layer.
    """

    def __init__(self, num_classes):
        super().__init__()
        self.lstm = layers.LSTM(units=128)
        self.dense = layers.Dense(units=num_classes, activation='softmax')

    def call(self, inputs):
        """Run ``inputs`` through the LSTM, then the softmax output layer."""
        return self.dense(self.lstm(inputs))

# Instantiate the model

model = LSTMModel(num_classes=NUM_CLASSES)

# Compile the model: labels are integer class indices, hence the sparse loss.

model.compile(
    loss=SparseCategoricalCrossentropy(),
    optimizer=Adam(),
    metrics=['accuracy'],
)

# Train the model, reporting validation metrics after each epoch.

history = model.fit(
    x=X_train,
    y=y_train,
    validation_data=(X_val, y_val),
    epochs=EPOCHS,
    batch_size=BATCH_SIZE,
)

# Evaluate the model on the held-out test set.

test_loss, test_accuracy = model.evaluate(x=X_test, y=y_test)
print("Test Loss:", test_loss)
print("Test Accuracy:", test_accuracy)

# Inference on new audio samples

def predict_audio(audio):
    """Predict the command label for a single audio clip.

    Args:
        audio: 1-D waveform sampled at SAMPLE_RATE, e.g. the output of
            ``tf.audio.decode_wav(..., desired_channels=1)`` with the
            channel axis squeezed away. Values are cast to float32 without
            rescaling.

    Returns:
        The entry of LABELS with the highest predicted probability.
    """
    # Feature extraction: these settings have to match whatever produced the
    # features the model was trained on, otherwise predictions are meaningless.
    waveform = tf.cast(tf.convert_to_tensor(audio), tf.float32)[:SAMPLE_RATE]
    # Trim / zero-pad to exactly one second so the frame count is fixed.
    waveform = tf.pad(waveform, [[0, SAMPLE_RATE - tf.shape(waveform)[0]]])

    # 25 ms windows with a 10 ms hop at 16 kHz.
    stft = tf.signal.stft(
        waveform, frame_length=400, frame_step=160, fft_length=512
    )
    spectrogram = tf.abs(stft)

    # mfccs_from_log_mel_spectrograms expects log-mel input, not raw audio.
    mel_matrix = tf.signal.linear_to_mel_weight_matrix(
        num_mel_bins=80,
        num_spectrogram_bins=spectrogram.shape[-1],
        sample_rate=SAMPLE_RATE,
        lower_edge_hertz=80.0,
        upper_edge_hertz=7600.0,
    )
    log_mel = tf.math.log(tf.tensordot(spectrogram, mel_matrix, 1) + 1e-6)
    mfcc = tf.signal.mfccs_from_log_mel_spectrograms(log_mel)[..., :MFCC_MAX_LEN]

    # The model expects a batch axis: (1, frames, coefficients).
    prediction = model.predict(tf.expand_dims(mfcc, axis=0))
    predicted_label_index = np.argmax(prediction[0])
    predicted_label = LABELS[predicted_label_index]
    return predicted_label

# Example usage for inference

# audio_sample = load_audio("path_to_audio_file")
# predicted_label = predict_audio(audio_sample)
# print("Predicted Label:", predicted_label)

Rebel-9 Manual v1.0
No ratings yet
Rebel-9 Manual v1.0
121 pages
Ass
No ratings yet
Ass
5 pages
Flow Chart:: Input Audio Preprocessing
No ratings yet
Flow Chart:: Input Audio Preprocessing
14 pages
Finetuning
No ratings yet
Finetuning
10 pages
Emonet
No ratings yet
Emonet
16 pages
Guide To YAMNet - Sound Event Classifier
No ratings yet
Guide To YAMNet - Sound Event Classifier
10 pages
Ex 7
No ratings yet
Ex 7
2 pages
ATI Ipynb
No ratings yet
ATI Ipynb
12 pages
DL
No ratings yet
DL
17 pages
Audio GAN
No ratings yet
Audio GAN
2 pages
Project Report - 092046
No ratings yet
Project Report - 092046
5 pages
DL 6
No ratings yet
DL 6
5 pages
Import As From Import From Import From Import From Import: # Load The IMDB Dataset
No ratings yet
Import As From Import From Import From Import From Import: # Load The IMDB Dataset
6 pages
DL Print Final
No ratings yet
DL Print Final
36 pages
MLSP Course Project Report
No ratings yet
MLSP Course Project Report
2 pages
CNN Lab Manual
No ratings yet
CNN Lab Manual
29 pages
Distinguishing Between Two Human Voices Using AI
No ratings yet
Distinguishing Between Two Human Voices Using AI
11 pages
DL 5 Excuted
No ratings yet
DL 5 Excuted
13 pages
DL 6th Exp Program
No ratings yet
DL 6th Exp Program
3 pages
Codefp 1
No ratings yet
Codefp 1
15 pages
EncoderDecoderSeq2Seq DeepLSTM
No ratings yet
EncoderDecoderSeq2Seq DeepLSTM
7 pages
Deep Learning Lab
No ratings yet
Deep Learning Lab
20 pages
Assignment 3
No ratings yet
Assignment 3
25 pages
DL Exps
No ratings yet
DL Exps
9 pages
DLTF Lab Manual.1
No ratings yet
DLTF Lab Manual.1
29 pages
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
No ratings yet
Exp. No.: I. Aim: AIML634P Neural Network Lab 2262034
6 pages
DL 22Q71A4206
No ratings yet
DL 22Q71A4206
65 pages
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
No ratings yet
566f0619-9145-4b8f-b12b-cb8a5b0cd30d
17 pages
Code For Ser
No ratings yet
Code For Ser
3 pages
DL Lab Answers Batch 2
No ratings yet
DL Lab Answers Batch 2
27 pages
DL Lab Manual
No ratings yet
DL Lab Manual
18 pages
DL 8
No ratings yet
DL 8
4 pages
DL 3
No ratings yet
DL 3
6 pages
Movie Review Classification
No ratings yet
Movie Review Classification
5 pages
Update On Speech Recognition System Using LibriSpeech
No ratings yet
Update On Speech Recognition System Using LibriSpeech
3 pages
Speech Command Recognition Using Deep Learning
No ratings yet
Speech Command Recognition Using Deep Learning
25 pages
Practical No11
No ratings yet
Practical No11
6 pages
ADL Exp File
No ratings yet
ADL Exp File
56 pages
Advanced Deep Learning Practical File
No ratings yet
Advanced Deep Learning Practical File
29 pages
Latihan UAP
No ratings yet
Latihan UAP
3 pages
Emotion Tagging in An Audio Signal Using Weakly Supervised Learning
No ratings yet
Emotion Tagging in An Audio Signal Using Weakly Supervised Learning
46 pages
Speech Emotion Recognition From Raw Audio Using Deep Learning
No ratings yet
Speech Emotion Recognition From Raw Audio Using Deep Learning
83 pages
Vocoder Summer School 2021
No ratings yet
Vocoder Summer School 2021
298 pages
MLSP Lab Exp3
No ratings yet
MLSP Lab Exp3
6 pages
MusicVAE - Explanation
No ratings yet
MusicVAE - Explanation
20 pages
Voice Emotion Recognition
No ratings yet
Voice Emotion Recognition
11 pages
Siamese Network Assignment
No ratings yet
Siamese Network Assignment
3 pages
LSTM Flow
No ratings yet
LSTM Flow
3 pages
Jamming Detection
No ratings yet
Jamming Detection
29 pages
DL - 5 Excuted
No ratings yet
DL - 5 Excuted
13 pages
Deep Learning Lab Practicals
No ratings yet
Deep Learning Lab Practicals
24 pages
ML PPT G3
No ratings yet
ML PPT G3
15 pages
Multi Layer Perceptron Tf2 Code Description
No ratings yet
Multi Layer Perceptron Tf2 Code Description
10 pages
Assignment 7
No ratings yet
Assignment 7
10 pages
ML Assignment
No ratings yet
ML Assignment
10 pages
RBPRATYUSH448
No ratings yet
RBPRATYUSH448
20 pages
Breaking Down The Mix - Using Python and Neural Networks To Separate Audio Tracks - by John MicMico - Artificial Intelligence in Plain English
No ratings yet
Breaking Down The Mix - Using Python and Neural Networks To Separate Audio Tracks - by John MicMico - Artificial Intelligence in Plain English
9 pages
Exp 8 Machine Translation
No ratings yet
Exp 8 Machine Translation
11 pages
Working of Sentimental Analysis
No ratings yet
Working of Sentimental Analysis
3 pages
JazzSolo LSTM
No ratings yet
JazzSolo LSTM
32 pages
CS 322 - Computer Organization Lecture 5 & 6
No ratings yet
CS 322 - Computer Organization Lecture 5 & 6
55 pages
Webhook
No ratings yet
Webhook
2 pages
EC2 Pricing Options
No ratings yet
EC2 Pricing Options
6 pages
EC2 Pricing
No ratings yet
EC2 Pricing
37 pages
CAF (Cloud Adoption Framework) in AWS AWS Cloud Adoption Framework (CAF)
No ratings yet
CAF (Cloud Adoption Framework) in AWS AWS Cloud Adoption Framework (CAF)
5 pages
Aws Certified Cloud Practitioner - 9
100% (1)
Aws Certified Cloud Practitioner - 9
28 pages
Sheet 1
No ratings yet
Sheet 1
7 pages
Project 1
No ratings yet
Project 1
30 pages
UNIT 03 - Electrochemistry
No ratings yet
UNIT 03 - Electrochemistry
10 pages
Grafik Kalkulator
No ratings yet
Grafik Kalkulator
2 pages
Short Notes On Servo Motor
100% (3)
Short Notes On Servo Motor
2 pages
Softening Behavior of Reinforced Concrete Beams Under Cyclic Loading
No ratings yet
Softening Behavior of Reinforced Concrete Beams Under Cyclic Loading
24 pages
Grinding System and Circuit of VRM Process Data Plant Data
67% (6)
Grinding System and Circuit of VRM Process Data Plant Data
58 pages
RES320 - Preisinger, Carrie FINAL EXAM
100% (1)
RES320 - Preisinger, Carrie FINAL EXAM
5 pages
EMT Handout
No ratings yet
EMT Handout
2 pages
GM Screen Daggerheart - Portrait
No ratings yet
GM Screen Daggerheart - Portrait
4 pages
Introduction To Computer Fundamentals
No ratings yet
Introduction To Computer Fundamentals
15 pages
Beamon's Model
No ratings yet
Beamon's Model
5 pages
Pick&Place Station Assembly Instructions
No ratings yet
Pick&Place Station Assembly Instructions
20 pages
FT-891 Quick Manual: (PWR/LOCK) Key RF/SQL Knob
No ratings yet
FT-891 Quick Manual: (PWR/LOCK) Key RF/SQL Knob
2 pages
II Sem Syllabus
No ratings yet
II Sem Syllabus
12 pages
W73153 International GCSE Science (Single Award) 4SS0 AN Accessible Version
No ratings yet
W73153 International GCSE Science (Single Award) 4SS0 AN Accessible Version
4 pages
Fabric Drape
No ratings yet
Fabric Drape
3 pages
Digital Signal Processing: Dr. Saad Muhi Falih
No ratings yet
Digital Signal Processing: Dr. Saad Muhi Falih
15 pages
Insertion Sort Algorithm and Complexity Analysis
No ratings yet
Insertion Sort Algorithm and Complexity Analysis
1 page
Unit Conversion Table: Distance Foot (FT) Inch (In) Meter (M) Centimeter (CM) Mile (Mi)
No ratings yet
Unit Conversion Table: Distance Foot (FT) Inch (In) Meter (M) Centimeter (CM) Mile (Mi)
2 pages
Project Report
100% (1)
Project Report
58 pages
Comparative Analysis of Water and Oil Media On Temperature Stability in PID Control-Based Digital Thermometer Calibrator
No ratings yet
Comparative Analysis of Water and Oil Media On Temperature Stability in PID Control-Based Digital Thermometer Calibrator
6 pages
Modelling Imperfectly Appropriable R&D Via Spillovers
No ratings yet
Modelling Imperfectly Appropriable R&D Via Spillovers
20 pages
Rt6-Xxx: Telecontrolli
No ratings yet
Rt6-Xxx: Telecontrolli
2 pages
PrecisionTree - Debbie House
No ratings yet
PrecisionTree - Debbie House
18 pages
What Are The Differences Between IE1-IE4
No ratings yet
What Are The Differences Between IE1-IE4
2 pages
28 Semiconductors Formula Sheets Quizrr
No ratings yet
28 Semiconductors Formula Sheets Quizrr
7 pages
Computer and Communication Networks Lab Manual (Lab 4) : Topic: Wireshark TCP Packets
No ratings yet
Computer and Communication Networks Lab Manual (Lab 4) : Topic: Wireshark TCP Packets
7 pages
BSC Aeronautical
No ratings yet
BSC Aeronautical
144 pages
Design of Rotation Inducing Rocket Fins and Their Analysis For Aerodynamic Stability
No ratings yet
Design of Rotation Inducing Rocket Fins and Their Analysis For Aerodynamic Stability
6 pages
Software Requirement Analysis AND Estimation Unit - 3
No ratings yet
Software Requirement Analysis AND Estimation Unit - 3
40 pages