
DeepFilterNet

The process below runs DeepFilterNet on a Telugu audio file, reports whether the audio is clear or noisy based on a noisiness score, and counts the filler words it contains.

Step 1: Log in to Hugging Face locally


!huggingface-cli login
Enter your Hugging Face access token when prompted to complete the login.
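
If you prefer to authenticate from Python rather than the CLI, the huggingface_hub package provides a login() helper; the token string below is a placeholder, not a real value.


from huggingface_hub import login

# Log in programmatically; replace the placeholder with your own access token
login(token="hf_xxxxxxxxxxxxxxxxxxxx")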

Step 2: Download the model


!git clone https://huggingface.co/spaces/hshr/DeepFilterNet2
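
Before going further, you can confirm the clone succeeded by checking that the checkpoint directory used in Step 5 is in place (the model_96.ckpt.best file referenced here also appears in the run log below).


import os

# List the cloned checkpoint directory; model_96.ckpt.best should appear here
print(os.listdir("/content/DeepFilterNet2/DeepFilterNet2/checkpoints"))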

Step 3: Install the requirements


!pip install -r /content/DeepFilterNet2/requirements.txt

Step 4: Install the required packages


!pip install torch torchaudio transformers
!pip install deepfilternet
!pip install googletrans==3.1.0a0
!pip install speechrecognition pydub
!apt-get install ffmpeg
!pip install transformers torchaudio librosa pydub
!pip install --upgrade googletrans==4.0.0-rc1 httpcore
!pip install torch torchaudio matplotlib SpeechRecognition googletrans==4.0.0-rc1 pydub
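
As a quick sanity check that the installs succeeded, you can exercise the imports used by the main script directly (a minimal sketch; it only prints versions):


import torch, torchaudio, speech_recognition, googletrans, pydub
from df.enhance import init_df, enhance

# If these imports succeed, the main script's dependencies are available
print(torch.__version__, torchaudio.__version__)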

Step 5: Run the main script


import torch
import torchaudio
import matplotlib.pyplot as plt
import speech_recognition as sr
from googletrans import Translator
from collections import Counter
from df.enhance import init_df, enhance
import time
from pydub import AudioSegment
from pydub.utils import make_chunks
import os

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Load the DeepFilterNet2 model and its state from the cloned repository
model, df, _ = init_df("/content/DeepFilterNet2/DeepFilterNet2",
                       config_allow_defaults=True)
model = model.to(device=device).eval()

def load_audio(file_path, sr=48000):
    # torchaudio returns the file's native sample rate; resample to the
    # model's 48 kHz rate if the file differs
    waveform, file_sr = torchaudio.load(file_path)
    if file_sr != sr:
        waveform = torchaudio.functional.resample(waveform, file_sr, sr)
    return waveform, sr

def measure_noisiness(audio_path, model, sr=48000, noise_threshold=0.5):
    waveform, sr = load_audio(audio_path, sr)

    # Downmix multi-channel audio to mono before enhancement
    if waveform.dim() > 1 and waveform.shape[0] > 1:
        waveform = waveform.mean(dim=0, keepdim=True)
    enhanced = enhance(model, df, waveform)

    # Spectrogram of the enhanced audio, with energy normalized to [0, 1]
    spectrogram = torchaudio.transforms.Spectrogram()(enhanced)
    spectral_energy = torch.mean(spectrogram.pow(2), dim=0)
    normalized_energy = spectral_energy / torch.max(spectral_energy)

    # Average the energy of the frames that exceed the noise threshold
    noisy_frames = normalized_energy[normalized_energy > noise_threshold]
    if noisy_frames.numel() == 0:
        return 0.0  # no frame exceeded the threshold
    average_noisy_energy = torch.mean(noisy_frames).item()

    return average_noisy_energy

def translate_text(text, src_lang, dest_lang, max_retries=3):
    translator = Translator()
    retries = 0
    while retries < max_retries:
        try:
            translated = translator.translate(text, src=src_lang, dest=dest_lang)
            return translated.text
        except Exception as e:
            print(f"Error translating '{text}': {e}")
            retries += 1
            time.sleep(1)  # wait before retrying
    return None

def segment_audio(audio_path, chunk_length_ms=60000):
    audio = AudioSegment.from_file(audio_path)
    chunks = make_chunks(audio, chunk_length_ms)
    return chunks

def recognize_audio_chunk(chunk, recognizer, language="te-IN", max_retries=3):
    retries = 0
    while retries < max_retries:
        try:
            with sr.AudioFile(chunk) as source:
                audio_data = recognizer.record(source)
                text = recognizer.recognize_google(audio_data, language=language)
                return text
        except sr.RequestError as e:
            print(f"Recognition error: {e}")
            retries += 1
            time.sleep(1)  # wait before retrying
        except sr.UnknownValueError:
            print("Speech Recognition could not understand audio")
            return None
    return None
def detect_fillers(audio_path, chunk_length_ms=60000):
    # Romanized Telugu filler words; each is translated into Telugu script
    # below so it can be matched against the recognized transcript
    english_fillers = ["alaaga", "inka", "ante", "alage", "antenti", "adi",
                       "abbo", "abba", "lla", "ela", "avunu", "leda", "mari",
                       "alāṇṭappuḍu", "poyindante", "ainappaṭikī", "edo",
                       "tappadu", "appuḍappuḍu", "sare"]

    telugu_fillers = []
    for filler in english_fillers:
        translated_filler = translate_text(filler, 'en', 'te')
        if translated_filler:
            telugu_fillers.append(translated_filler)
        else:
            telugu_fillers.append(filler)  # fall back to the original text

    recognizer = sr.Recognizer()
    audio_chunks = segment_audio(audio_path, chunk_length_ms)

    # Transcribe each chunk and collect the recognized text
    text_segments = []
    for i, chunk in enumerate(audio_chunks):
        chunk_name = f"/tmp/chunk{i}.wav"
        chunk.export(chunk_name, format="wav")
        text = recognize_audio_chunk(chunk_name, recognizer)
        if text:
            text_segments.append(text)
        os.remove(chunk_name)  # clean up the temporary chunk file

    full_text = " ".join(text_segments)

    print("Recognized Text (Telugu):", full_text)

    # Count occurrences of each translated filler in the transcript
    filler_count = Counter()
    for telugu_filler, english_filler in zip(telugu_fillers, english_fillers):
        count = full_text.count(telugu_filler)
        if count > 0:
            filler_count[english_filler] = count

    for english_filler, count in filler_count.items():
        print(f"Filler '{english_filler}' detected {count} times.")

    total_fillers = sum(filler_count.values())
    print(f"Total fillers detected: {total_fillers}")
audio_file = "/content/drive/MyDrive/input.wav"

# Measure noisy energy first
average_noisy_energy = measure_noisiness(audio_file, model)
print(f"Average Noisy Energy: {average_noisy_energy}")

if average_noisy_energy <= 0.75:
    print("Audio is clear.")
else:
    print("Audio is noisy.")

# Then detect fillers
detect_fillers(audio_file)
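
The script discards the enhanced waveform after scoring it. If you also want to keep the denoised audio, a minimal sketch along the same lines (the output path is an assumption):


waveform, _ = load_audio("/content/drive/MyDrive/input.wav")
if waveform.dim() > 1 and waveform.shape[0] > 1:
    waveform = waveform.mean(dim=0, keepdim=True)
enhanced = enhance(model, df, waveform)

# Write the denoised audio at the model's 48 kHz rate (hypothetical output path)
torchaudio.save("/content/enhanced.wav", enhanced.cpu(), 48000)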

Output:

2024-07-15 07:00:58 | INFO | DF | Loading model settings of DeepFilterNet2
2024-07-15 07:00:58 | INFO | DF | Initializing model `deepfilternet2`
2024-07-15 07:00:59 | INFO | DF | Found checkpoint /content/DeepFilterNet2/DeepFilterNet2/checkpoints/model_96.ckpt.best with epoch 96
2024-07-15 07:00:59 | INFO | DF | Running on device cpu
2024-07-15 07:00:59 | INFO | DF | Model loaded
Average Noisy Energy: 0.6249315142631531
Audio is clear.
Error translating 'alage': the JSON object must be str, bytes or bytearray, not NoneType
Error translating 'antenti': the JSON object must be str, bytes or bytearray, not NoneType
Error translating 'abba': the JSON object must be str, bytes or bytearray, not NoneType
Error translating 'lla': the JSON object must be str, bytes or bytearray, not NoneType
Error translating 'sare': the JSON object must be str, bytes or bytearray, not NoneType
Recognized Text (Telugu): పని ప్రతి సినిమాకు ఒక ఎక్కడ ఉంది కదా సార్ ఊహలు గుసగుసలాడే కి ఓ జి జి ఎల్ అని పెట్టారు అంత మంచిది అనిపిస్తుంది అప్పుడప్పుడు మీ సినిమాలు ఎందుకు పెట్టారు ఈ ఫిలిం గా మన ఫిబ్రవరిలో అబ్బాయి అమ్మాయి కలిసి ఉన్నారు అందుకని ఎక్కువగా వాడుతూ ఉంటారు అమ్మాయి చేతిలో పెట్టి అవును అవును చేశారు నాకు అవన్నీ సెకండ్ ఇయర్ అండి నాకు అల్టిమేట్ మేటర్స్ ఇస్ అబ్బాయి అమ్మాయి మీద కూడా సెకండరీ ఇద్దరు మనుషులు అంతే అండ్ వాళ్ళిద్దరూ ఒక లిస్టు పడినప్పుడు వాట్ ఆర్ ద ప్రాబ్లమ్స్ ప్రాబ్లమ్స్ కూడా కాదు ఆ ఇష్టం ఎందువల్ల దానికి ఏమి అడ్డు పడింది దాని వల్ల ఎలా చేయించారు అనేది నాకు మెయిన్ బీర్ బాటిల్ ...................
Filler 'inka' detected 3 times.
Filler 'abba' detected 3 times.
Filler 'ela' detected 10 times.
Filler 'mari' detected 2 times.
Total fillers detected: 18
