
!pip install TTS


!pip install numpy==1.24.0

from google.colab import files

import os
import subprocess

uploaded = None

def upload_video():
    global uploaded
    global video_path
    uploaded = files.upload()
    for filename in uploaded.keys():
        print(f'Uploaded {filename}')
        video_path = filename
        return filename

import ipywidgets as widgets

from IPython.display import display

button = widgets.Button(description="Upload Video")

output = widgets.Output()

def on_button_clicked(b):
    with output:
        global video_path
        video_path = upload_video()

button.on_click(on_button_clicked)
display(button, output)

!pip install googletrans==3.1.0a0

import subprocess
from tqdm.notebook import tqdm
import time

# Ensure the video_path variable exists
if 'video_path' in globals() and video_path is not None:
    ffmpeg_command = f"ffmpeg -i '{video_path}' -acodec pcm_s24le -ar 48000 -q:a 0 -map a -y 'output_audio.wav'"
    start_time = time.time()  # Start timing
    subprocess.run(ffmpeg_command, shell=True)
    end_time = time.time()  # Stop timing
    duration = end_time - start_time
    print(f"Audio conversion completed in {duration:.2f} seconds.")
else:
    print("No video uploaded. Please upload a video first.")
import whisper

model = whisper.load_model("base")
# Transcribe the original audio and save the result to a text file
result_original = model.transcribe("output_audio.wav", verbose=True, fp16=False, language='pt')
with open("legendas_original.txt", "w") as f:
    f.write(result_original["text"])

print("Subtitles for the original audio saved to legendas_original.txt")


start_time = time.time()  # Start timing
result = model.transcribe("output_audio.wav", verbose=True, fp16=False, language='pt')  # Force Whisper to treat the audio as Portuguese
end_time = time.time()  # Stop timing
duration = end_time - start_time
print(f"Transcription completed in {duration:.2f} seconds.")

whisper_text = result["text"]
whisper_language = result['language']

print("Transcribed text:", whisper_text)

print("Original language (set to Portuguese):", whisper_language)

!pip install googletrans==3.1.0a0  # Downgrade to a version that works

target_language = "English" #@param ["English", "Spanish", "French", "German", "Italian", "Portuguese", "Polish", "Turkish", "Russian", "Dutch", "Czech", "Arabic", "Chinese (Simplified)"]

# Mapping between full names and ISO 639-1 codes
language_mapping = {
    'English': 'en',
    'Spanish': 'es',
    'French': 'fr',
    'German': 'de',
    'Italian': 'it',
    'Portuguese': 'pt',
    'Polish': 'pl',
    'Turkish': 'tr',
    'Russian': 'ru',
    'Dutch': 'nl',
    'Czech': 'cs',
    'Arabic': 'ar',
    'Chinese (Simplified)': 'zh-cn'
}

target_language_code = language_mapping[target_language]

from googletrans import Translator

translator = Translator()

# Add a delay to avoid rate limiting
time.sleep(1)

# Handle potential translation errors
try:
    start_time = time.time()  # Start timing
    translated_text = translator.translate(whisper_text, dest=target_language_code).text  # Translate from the detected Portuguese
    end_time = time.time()  # Stop timing
    duration = end_time - start_time
    print(f"Translation completed in {duration:.2f} seconds.")
    print(f"Text translated to {target_language}:", translated_text)
except Exception as e:
    print(f"Translation failed: {e}")
    print("Returned object:", translator.translate(whisper_text, dest=target_language_code))

# Save the translated text to a text file
with open("legendas_traduzidas.txt", "w") as f:
    f.write(translated_text)

print("Subtitles for the translated audio saved to legendas_traduzidas.txt")
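googletrans enforces a per-request character limit, so a long transcript can fail or come back truncated. A minimal sketch that splits the text into chunks before translating; the 4000-character limit and the translate_long name are assumptions, not part of the original notebook:

def translate_long(text, dest, max_chars=4000):
    # Split on sentence boundaries so each request stays under the assumed limit
    chunks, current = [], ""
    for sentence in text.split(". "):
        candidate = f"{current}. {sentence}" if current else sentence
        if len(candidate) > max_chars and current:
            chunks.append(current)
            current = sentence
        else:
            current = candidate
    if current:
        chunks.append(current)
    parts = []
    for chunk in chunks:
        parts.append(translator.translate(chunk, dest=dest).text)
        time.sleep(1)  # pause between requests to avoid rate limiting
    return " ".join(parts)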

from TTS.api import TTS

import torch
from IPython.display import Audio, display

# Create the TTS model instance, pinned to the CPU
tts = TTS("tts_models/multilingual/multi-dataset/xtts_v2").to("cpu")

# Generate the audio, cloning the voice from the original track
tts.tts_to_file(
    translated_text,
    speaker_wav='output_audio.wav',
    file_path="output_synth.wav",
    language=target_language_code
)

audio_widget = Audio(filename="output_synth.wav", autoplay=False)


display(audio_widget)
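Synthesized speech rarely matches the original track's length, which affects how natural the lip sync will look. A quick comparison of the two durations using the standard-library wave module; this is just a convenience check, not part of the original pipeline:

import wave

def wav_duration(path):
    # Duration in seconds = frame count / sample rate
    with wave.open(path, "rb") as w:
        return w.getnframes() / w.getframerate()

orig = wav_duration("output_audio.wav")
synth = wav_duration("output_synth.wav")
print(f"Original: {orig:.1f}s, synthesized: {synth:.1f}s ({synth / orig:.0%} of original)")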

If you are on the Google Colab free tier (T4), delete the TTS and Whisper models at this step to free memory.

import torch

try:
    del tts
except NameError:
    print("Voice model already deleted")
try:
    del model
except NameError:
    print("Whisper model already deleted")

torch.cuda.empty_cache()
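Note that del only drops the Python references; a short sketch that also runs the garbage collector and reports the memory still held, to confirm the cleanup worked (assuming a CUDA runtime is active):

import gc

gc.collect()
torch.cuda.empty_cache()
if torch.cuda.is_available():
    # Report GPU memory still held by live tensors after cleanup
    print(f"GPU memory allocated: {torch.cuda.memory_allocated() / 1024**2:.0f} MiB")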

Lip Sync - High Quality

Installation takes around 15 minutes on the free Colab tier (T4).

# Dependencies
%cd /content/

import locale
locale.getpreferredencoding = lambda: "UTF-8"

!git clone https://github.com/vinthony/video-retalking.git &> /dev/null

!sudo apt-get install -y libblas-dev liblapack-dev libx11-dev libopenblas-dev

!git clone https://github.com/davisking/dlib.git

!pip install basicsr==1.4.2 face-alignment==1.3.4 kornia==0.5.1 ninja==1.10.2.3 einops==0.4.1 facexlib==0.2.5 librosa==0.9.2 build

!cd dlib && python setup.py install

%cd /content/video-retalking

!mkdir ./checkpoints
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/30_net_gen.pth -O ./checkpoints/30_net_gen.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/BFM.zip -O ./checkpoints/BFM.zip
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/DNet.pt -O ./checkpoints/DNet.pt
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/ENet.pth -O ./checkpoints/ENet.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/expression.mat -O ./checkpoints/expression.mat
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/face3d_pretrain_epoch_20.pth -O ./checkpoints/face3d_pretrain_epoch_20.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/GFPGANv1.3.pth -O ./checkpoints/GFPGANv1.3.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/GPEN-BFR-512.pth -O ./checkpoints/GPEN-BFR-512.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/LNet.pth -O ./checkpoints/LNet.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/ParseNet-latest.pth -O ./checkpoints/ParseNet-latest.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/RetinaFace-R50.pth -O ./checkpoints/RetinaFace-R50.pth
!wget https://github.com/vinthony/video-retalking/releases/download/v0.0.1/shape_predictor_68_face_landmarks.dat -O ./checkpoints/shape_predictor_68_face_landmarks.dat
!unzip -d ./checkpoints/BFM ./checkpoints/BFM.zip
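Downloads on Colab occasionally fail silently, so it can be worth confirming every expected checkpoint landed before running inference. A quick sketch whose file list simply mirrors the wget commands above:

import os

expected = [
    "30_net_gen.pth", "BFM.zip", "DNet.pt", "ENet.pth", "expression.mat",
    "face3d_pretrain_epoch_20.pth", "GFPGANv1.3.pth", "GPEN-BFR-512.pth",
    "LNet.pth", "ParseNet-latest.pth", "RetinaFace-R50.pth",
    "shape_predictor_68_face_landmarks.dat",
]
missing = [f for f in expected if not os.path.exists(f"./checkpoints/{f}")]
print("All checkpoints present." if not missing else f"Missing: {missing}")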

# Generate video

%cd /content/video-retalking

video_path_fix = f"'../{video_path}'"

!python inference.py \
--face $video_path_fix \
--audio "/content/output_synth.wav" \
--outfile '/content/output_high_qual.mp4'

Download videos

from google.colab import files
from IPython.core.display import display, HTML
import ipywidgets as widgets
import base64
import os

# List of video paths to check
video_paths = ["/content/output_video.mp4", "/content/output_high_qual.mp4"]

def download_video(b):
    files.download(b.video_path)

download_buttons = []

# Layout definition for the buttons
button_layout = widgets.Layout(width='250px')

# Loop through each video path, check for existence, and display it
for video_path in video_paths:
    if os.path.exists(video_path):
        # Encode the video as base64
        with open(video_path, "rb") as video_file:
            video_base64 = base64.b64encode(video_file.read()).decode()

        # HTML widget for the video
        video_html = HTML(data=f"""
        <video width=400 controls>
          <source src="data:video/mp4;base64,{video_base64}" type="video/mp4" />
        </video>
        """)

        # Button widget wired to download the video at this path
        download_button = widgets.Button(
            description=f"Download {os.path.basename(video_path)}",
            layout=button_layout
        )
        download_button.video_path = video_path
        download_button.on_click(download_video)
        download_buttons.append(download_button)

        # Display widgets
        display(video_html)
        display(download_button)
