|
import gradio as gr |
|
import argparse |
|
import os |
|
import torch |
|
from time import sleep |
|
from tqdm import tqdm |
|
from lang_list import union_language_dict |
|
|
|
from pytube import YouTube |
|
import re |
|
from PIL import Image |
|
import urllib.request |
|
|
|
NUMBER = 100 |
|
DEVICE = "cuda" if torch.cuda.is_available() else "cpu" |
|
DOWNLOAD = True |
|
SLICE_AUDIO = True |
|
SEPARE_VOCALS = False |
|
TRANSCRIBE_AUDIO = True |
|
CONCATENATE_TRANSCRIPTIONS = True |
|
TRANSLATE_TRANSCRIPTIONS = True |
|
ADD_SUBTITLES_TO_VIDEO = True |
|
REMOVE_FILES = False |
|
if DEVICE == "cpu": |
|
|
|
SECONDS = 300 |
|
else: |
|
SECONDS = 300 |
|
|
|
YOUTUBE = "youtube" |
|
TWITCH = "twitch" |
|
ERROR = "error" |
|
|
|
urllib.request.urlretrieve('https://maximofn.com/wp-content/uploads/2023/11/subtify_logo-scaled.webp', "subtify_logo.webp") |
|
subtify_logo = Image.open("subtify_logo.webp") |
|
subtify_logo_width, subtify_logo_height = subtify_logo.size |
|
factor = 5 |
|
new_width = subtify_logo_width // factor |
|
new_height = subtify_logo_height // factor |
|
|
|
html_social_media = ''' |
|
<div style="float: right;"> |
|
<a href="https://maximofn.com/" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/MFN.svg" alt="MFN icon" width="16px"> |
|
</a> |
|
<a href="http://github.com/maximofn" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<svg xmlns="http://www.w3.org/2000/svg" height="1em" viewBox="0 0 496 512"> |
|
<style> |
|
svg { |
|
fill: #f3f4f6; |
|
} |
|
</style> |
|
<path d="M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6zm-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3zm44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9zM244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8zM97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1zm-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7zm32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1zm-11.4-14.7c-1.6 1-1.6 3.6 0 5.9 1.6 2.3 4.3 3.3 5.6 2.3 1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2z"/> |
|
</svg> |
|
</a> |
|
<a href="http://linkedin.com/in/MaximoFN/" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/linkedin.svg" alt="linkedin icon"> |
|
</a> |
|
<a href="https://www.facebook.com/profile.php?id=100085177670661" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/facebook.svg" alt="facebook icon"> |
|
</a> |
|
<a href="https://twitter.com/Maximo_fn" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/x.svg" alt="x icon"> |
|
</a> |
|
<a href="https://www.instagram.com/maximo__fn/" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/instagram.svg" alt="instagram icon"> |
|
</a> |
|
<a href="https://www.tiktok.com/@maximo__fn" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/tiktok.svg" alt="tiktok icon"> |
|
</a> |
|
<a href="https://www.twitch.tv/maximofn/" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/twitch.svg" alt="twitch icon"> |
|
</a> |
|
<a href="https://www.youtube.com/channel/UCdQwg2JU_fWRsHn3yIlf3tw" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/youtube.svg" alt="youtube icon"> |
|
</a> |
|
<a href="http://kaggle.com/maximofn" rel="noopener noreferrer" aria-disabled="false" class="sm secondary svelte-cmf5ev" id="component-1" style="flex-grow: 100;" target="_blank"> |
|
<img src="http://127.0.0.1:7860/file=assets/kaggle.svg" alt="kaggle icon"> |
|
</a> |
|
</div> |
|
''' |
|
|
|
html_subtify_logo = f"<img src='http://127.0.0.1:7860/file=subtify_logo.webp' style='width: {new_width}px; height: {new_height}px; margin-left: auto; margin-right: auto; display: block;'/>" |
|
|
|
html_buy_me_a_coffe = ''' |
|
<div style="float: right;"> |
|
<a href="https://www.buymeacoffee.com/maximofn" target="_blank"> |
|
<img src="https://img.shields.io/badge/Buy_Me_A_Coffee-support_my_work-FFDD00?style=for-the-badge&logo=buy-me-a-coffee&logoColor=white&labelColor=101010" alt="buy me a coffe"> |
|
</a> |
|
</div> |
|
''' |
|
|
|
language_dict = union_language_dict() |
|
|
|
def subtify_no_ui(): |
|
number_works = 7 |
|
progress_bar = tqdm(total=number_works, desc="Subtify") |
|
folder_vocals = "vocals" |
|
folder_chunck = "chunks" |
|
folder_concatenated = "concatenated_transcriptions" |
|
folder_translated_transcriptions = "translated_transcriptions" |
|
if not os.path.exists(folder_vocals): |
|
os.makedirs(folder_vocals) |
|
if not os.path.exists(folder_chunck): |
|
os.makedirs(folder_chunck) |
|
if not os.path.exists(folder_concatenated): |
|
os.makedirs(folder_concatenated) |
|
if not os.path.exists(folder_translated_transcriptions): |
|
os.makedirs(folder_translated_transcriptions) |
|
|
|
|
|
if DOWNLOAD: |
|
print('*'*NUMBER) |
|
|
|
|
|
|
|
url = "https://www.youtube.com/watch?v=dgOBxhi19T8" |
|
|
|
|
|
print(f"Downloading video and audio from {url}") |
|
python_file = "download.py" |
|
command = f"python {python_file} {url}" |
|
os.system(command) |
|
sleep(5) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
if SLICE_AUDIO: |
|
print('*'*NUMBER) |
|
print("Slicing audio") |
|
python_file = "slice_audio.py" |
|
audio = "audios/download_audio.mp3" |
|
command = f"python {python_file} {audio} {SECONDS}" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
chunck_file = "chunks/output_files.txt" |
|
print('*'*NUMBER) |
|
if SEPARE_VOCALS: |
|
print("Get vocals") |
|
python_file = "separe_vocals.py" |
|
command = f"python {python_file} {chunck_file} {DEVICE}" |
|
os.system(command) |
|
if REMOVE_FILES: |
|
with open(chunck_file, 'r') as f: |
|
files = f.read().splitlines() |
|
for file in files: |
|
command = f"rm {file}" |
|
os.system(command) |
|
else: |
|
print("Moving chunks") |
|
with open(f"{folder_vocals}/speakers.txt", 'w') as f: |
|
f.write(str(0)) |
|
if REMOVE_FILES: |
|
command = f"mv {folder_chunck}/*.mp3 {folder_vocals}/" |
|
os.system(command) |
|
else: |
|
command = f"cp {folder_chunck}/*.mp3 {folder_vocals}/" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
speakers_file = "vocals/speakers.txt" |
|
if TRANSCRIBE_AUDIO: |
|
print('*'*NUMBER) |
|
print("Transcript vocals") |
|
python_file = "transcribe.py" |
|
language = "English" |
|
command = f"python {python_file} {chunck_file} {language} {speakers_file} {DEVICE} {not SEPARE_VOCALS}" |
|
os.system(command) |
|
if REMOVE_FILES: |
|
vocals_folder = "vocals" |
|
with open(chunck_file, 'r') as f: |
|
files = f.read().splitlines() |
|
with open(speakers_file, 'r') as f: |
|
speakers = f.read().splitlines() |
|
speakers = int(speakers[0]) |
|
for file in files: |
|
if speakers > 0: |
|
vocals_extension = "wav" |
|
for i in range(speakers): |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
vocal = f'{vocals_folder}/{file_name}_speaker{i:003d}.{vocals_extension}' |
|
command = f"rm {vocal}" |
|
os.system(command) |
|
else: |
|
vocals_extension = "mp3" |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
vocal = f'{vocals_folder}/{file_name}.{vocals_extension}' |
|
command = f"rm {vocal}" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
if CONCATENATE_TRANSCRIPTIONS: |
|
print('*'*NUMBER) |
|
print("Concatenate transcriptions") |
|
python_file = "concat_transcriptions.py" |
|
command = f"python {python_file} {chunck_file} {SECONDS} {speakers_file}" |
|
os.system(command) |
|
if REMOVE_FILES: |
|
with open(chunck_file, 'r') as f: |
|
files = f.read().splitlines() |
|
for file in files: |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
transcriptions_folder = "transcriptions" |
|
transcription_extension = "srt" |
|
command = f"rm {transcriptions_folder}/{file_name}.{transcription_extension}" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
target_languaje = "Español" |
|
if TRANSLATE_TRANSCRIPTIONS: |
|
print('*'*NUMBER) |
|
print("Translate transcription") |
|
transcription_file = "concatenated_transcriptions/download_audio.srt" |
|
source_languaje = "English" |
|
python_file = "translate_transcriptions.py" |
|
command = f"python {python_file} {transcription_file} --source_languaje {source_languaje} --target_languaje {target_languaje} --device {DEVICE}" |
|
os.system(command) |
|
if REMOVE_FILES: |
|
command = f"rm {transcription_file}" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
|
|
if ADD_SUBTITLES_TO_VIDEO: |
|
print('*'*NUMBER) |
|
print("Add subtitles to video") |
|
python_file = "add_subtitles_to_video.py" |
|
transcription_file = f"translated_transcriptions/download_audio_{target_languaje}.srt" |
|
input_video_file = "videos/download_video.mp4" |
|
input_audio_file = "audios/download_audio.mp3" |
|
command = f"python {python_file} {transcription_file} {input_video_file} {input_audio_file}" |
|
os.system(command) |
|
if REMOVE_FILES: |
|
command = f"rm {input_video_file}" |
|
os.system(command) |
|
command = f"rm {input_audio_file}" |
|
os.system(command) |
|
command = f"rm {transcription_file}" |
|
os.system(command) |
|
command = f"rm chunks/output_files.txt" |
|
os.system(command) |
|
command = f"rm vocals/speakers.txt" |
|
os.system(command) |
|
print('*'*NUMBER) |
|
print("\n\n") |
|
progress_bar.update(1) |
|
|
|
def remove_all_files(): |
|
command = f"rm -r audios" |
|
os.system(command) |
|
command = f"rm -r chunks" |
|
os.system(command) |
|
command = f"rm -r concatenated_transcriptions" |
|
os.system(command) |
|
command = f"rm -r transcriptions" |
|
os.system(command) |
|
command = f"rm -r translated_transcriptions" |
|
os.system(command) |
|
command = f"rm -r videos" |
|
os.system(command) |
|
command = f"rm -r vocals" |
|
os.system(command) |
|
|
|
|
|
|
|
|
|
def reset_frontend(): |
|
visible = False |
|
return ( |
|
"", |
|
gr.Image(visible=visible), |
|
gr.Dropdown(visible=visible), |
|
gr.Dropdown(visible=visible), |
|
gr.Dropdown(visible=visible), |
|
gr.Button(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Textbox(visible=visible), |
|
gr.Video(visible=visible), |
|
) |
|
|
|
def show_auxiliar_block1(): |
|
return gr.Textbox(value="URL checked", visible=True) |
|
|
|
def get_youtube_thumbnail(url): |
|
yt = YouTube(url) |
|
thumbnail_url = yt.thumbnail_url |
|
return thumbnail_url |
|
|
|
def is_valid_youtube_url(url): |
|
|
|
|
|
|
|
|
|
patron_youtube = r'(https?://)?(www\.)?(youtube\.com/watch\?v=|youtu\.be/)[\w-]+' |
|
return bool(re.match(patron_youtube, url)) |
|
|
|
def is_valid_twitch_url(url): |
|
|
|
|
|
|
|
|
|
twitch_pattern = r'(https?://)?(www\.)?twitch\.tv/(videos/\d+|\w+)' |
|
return bool(re.match(twitch_pattern, url)) |
|
|
|
def is_valid_url(url): |
|
num_speaker = [10, 9, 8, 7, 6, 5, 4, 3, 2, 1] |
|
source_languaje = gr.Dropdown(visible=True, label="Source languaje", show_label=True, value="English", choices=language_dict, scale=1, interactive=True) |
|
target_languaje = gr.Dropdown(visible=True, label="Target languaje", show_label=True, value="Español", choices=language_dict, scale=1, interactive=True) |
|
number_of_speakers = gr.Dropdown(visible=True, label="Number of speakers", show_label=True, value=10, choices=num_speaker, scale=1, interactive=True) |
|
subtify_button = gr.Button(size="lg", value="subtify", min_width="10px", scale=0, visible=True) |
|
|
|
|
|
if "youtube" in url.lower() or "youtu.be" in url.lower(): |
|
if is_valid_youtube_url(url): |
|
thumbnail = get_youtube_thumbnail(url) |
|
if thumbnail: |
|
return ( |
|
gr.Image(value=thumbnail, visible=True, show_download_button=False, container=False), |
|
source_languaje, |
|
target_languaje, |
|
number_of_speakers, |
|
subtify_button, |
|
) |
|
else: |
|
return ( |
|
gr.Image(value="assets/youtube-no-thumbnails.webp", visible=True, show_download_button=False, container=False), |
|
source_languaje, |
|
target_languaje, |
|
number_of_speakers, |
|
subtify_button, |
|
) |
|
|
|
|
|
elif "twitch" in url.lower() or "twitch.tv" in url.lower(): |
|
if is_valid_twitch_url(url): |
|
return ( |
|
gr.Image(value="assets/twitch.webp", visible=True, show_download_button=False, container=False), |
|
source_languaje, |
|
target_languaje, |
|
number_of_speakers, |
|
subtify_button, |
|
) |
|
|
|
|
|
visible = False |
|
image = gr.Image(value="assets/youtube_error.webp", visible=visible, show_download_button=False, container=False) |
|
source_languaje = gr.Dropdown(visible=visible, label="Source languaje", show_label=True, value="English", choices=language_dict, scale=1, interactive=True) |
|
target_languaje = gr.Dropdown(visible=visible, label="Target languaje", show_label=True, value="Español", choices=language_dict, scale=1, interactive=True) |
|
number_of_speakers = gr.Dropdown(visible=visible, label="Number of speakers", show_label=True, value=10, choices=num_speaker, scale=1, interactive=True) |
|
subtify_button = gr.Button(size="lg", value="subtify", min_width="10px", scale=0, visible=visible) |
|
return ( |
|
image, |
|
source_languaje, |
|
target_languaje, |
|
number_of_speakers, |
|
subtify_button, |
|
) |
|
|
|
def change_visibility_texboxes(): |
|
|
|
return ( |
|
gr.Textbox(value="Done"), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=True), |
|
gr.Textbox(visible=False), |
|
) |
|
|
|
def get_audio_and_video_from_video(url): |
|
python_file = "download.py" |
|
command = f"python {python_file} {url}" |
|
os.system(command) |
|
sleep(1) |
|
|
|
audio = "audios/download_audio.mp3" |
|
video = "videos/download_video.mp4" |
|
|
|
return ( |
|
gr.Textbox(value="Ok"), |
|
gr.Textbox(value=audio), |
|
gr.Textbox(value=video), |
|
) |
|
|
|
def slice_audio(audio_path): |
|
folder_vocals = "vocals" |
|
folder_chunck = "chunks" |
|
if not os.path.exists(folder_vocals): |
|
os.makedirs(folder_vocals) |
|
if not os.path.exists(folder_chunck): |
|
os.makedirs(folder_chunck) |
|
|
|
python_file = "slice_audio.py" |
|
command = f"python {python_file} {audio_path} {SECONDS}" |
|
os.system(command) |
|
|
|
with open(f"{folder_vocals}/speakers.txt", 'w') as f: |
|
f.write(str(0)) |
|
command = f"mv {folder_chunck}/*.mp3 {folder_vocals}/" |
|
os.system(command) |
|
|
|
return ( |
|
gr.Textbox(value="Ok") |
|
) |
|
|
|
def trascribe_audio(source_languaje): |
|
folder_vocals = "vocals" |
|
python_file = "transcribe.py" |
|
chunck_file = "chunks/output_files.txt" |
|
speakers_file = "vocals/speakers.txt" |
|
command = f"python {python_file} {chunck_file} {source_languaje} {speakers_file} {DEVICE} {not SEPARE_VOCALS}" |
|
os.system(command) |
|
|
|
with open(chunck_file, 'r') as f: |
|
files = f.read().splitlines() |
|
with open(speakers_file, 'r') as f: |
|
speakers = f.read().splitlines() |
|
speakers = int(speakers[0]) |
|
for file in files: |
|
if speakers > 0: |
|
vocals_extension = "wav" |
|
for i in range(speakers): |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
vocal = f'{folder_vocals}/{file_name}_speaker{i:003d}.{vocals_extension}' |
|
command = f"rm {vocal}" |
|
os.system(command) |
|
else: |
|
vocals_extension = "mp3" |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
vocal = f'{folder_vocals}/{file_name}.{vocals_extension}' |
|
command = f"rm {vocal}" |
|
os.system(command) |
|
|
|
return ( |
|
gr.Textbox(value="Ok") |
|
) |
|
|
|
def concatenate_transcriptions(): |
|
folder_concatenated = "concatenated_transcriptions" |
|
if not os.path.exists(folder_concatenated): |
|
os.makedirs(folder_concatenated) |
|
|
|
chunck_file = "chunks/output_files.txt" |
|
speakers_file = "vocals/speakers.txt" |
|
python_file = "concat_transcriptions.py" |
|
command = f"python {python_file} {chunck_file} {SECONDS} {speakers_file}" |
|
os.system(command) |
|
|
|
with open(chunck_file, 'r') as f: |
|
files = f.read().splitlines() |
|
for file in files: |
|
file_name, _ = file.split(".") |
|
_, file_name = file_name.split("/") |
|
transcriptions_folder = "transcriptions" |
|
transcription_extension = "srt" |
|
command = f"rm {transcriptions_folder}/{file_name}.{transcription_extension}" |
|
os.system(command) |
|
|
|
audio_transcribed = "concatenated_transcriptions/download_audio.srt" |
|
|
|
return ( |
|
gr.Textbox(value="Ok"), |
|
gr.Textbox(value=audio_transcribed), |
|
) |
|
|
|
def translate_transcription(original_audio_transcribed_path, source_languaje, target_languaje): |
|
folder_translated_transcriptions = "translated_transcriptions" |
|
if not os.path.exists(folder_translated_transcriptions): |
|
os.makedirs(folder_translated_transcriptions) |
|
|
|
python_file = "translate_transcriptions.py" |
|
command = f"python {python_file} {original_audio_transcribed_path} --source_languaje {source_languaje} --target_languaje {target_languaje} --device {DEVICE}" |
|
os.system(command) |
|
|
|
translated_transcription = f"translated_transcriptions/download_audio_{target_languaje}.srt" |
|
|
|
transcription_file = "concatenated_transcriptions/download_audio.srt" |
|
command = f"rm {transcription_file}" |
|
os.system(command) |
|
|
|
return ( |
|
gr.Textbox(value="Ok"), |
|
gr.Textbox(value=translated_transcription) |
|
) |
|
|
|
def add_translated_subtitles_to_video(original_video_path, original_audio_path, original_audio_translated_path): |
|
python_file = "add_subtitles_to_video.py" |
|
command = f"python {python_file} {original_audio_translated_path} {original_video_path} {original_audio_path}" |
|
os.system(command) |
|
|
|
command = f"rm {original_video_path}" |
|
os.system(command) |
|
command = f"rm {original_audio_path}" |
|
os.system(command) |
|
command = f"rm {original_audio_translated_path}" |
|
os.system(command) |
|
command = f"rm chunks/output_files.txt" |
|
os.system(command) |
|
command = f"rm vocals/speakers.txt" |
|
os.system(command) |
|
|
|
subtitled_video = "videos/download_video_with_subtitles.mp4" |
|
|
|
return ( |
|
gr.Textbox(value="Ok"), |
|
gr.Video(value=subtitled_video, visible=True), |
|
) |
|
|
|
def subtify(): |
|
with gr.Blocks() as demo: |
|
num_speaker = [10, 9, 8, 7, 6, 5, 4, 3, 2, 1] |
|
|
|
|
|
gr.Markdown(html_social_media) |
|
gr.Markdown("<h1 style='text-align: center;'>Subtify</h1>") |
|
gr.Markdown(html_subtify_logo) |
|
with gr.Row(variant="panel"): |
|
url_textbox = gr.Textbox(placeholder="Add video URL here", label="Video URL", elem_id="video_url", scale=1, interactive=True) |
|
|
|
delete_button = gr.Button(size="sm", icon="icons/delete.svg", value="", min_width="10px", scale=0) |
|
|
|
visible = False |
|
auxiliar_block1 = gr.Textbox(label="Auxiliar block 1", elem_id="auxiliar_block1", interactive=False, visible=visible) |
|
with gr.Row(equal_height=False): |
|
image = gr.Image(visible=visible, scale=1) |
|
with gr.Column(): |
|
with gr.Row(): |
|
source_languaje = gr.Dropdown(visible=visible, label="Source languaje", show_label=True, value="English", choices=language_dict, scale=1, interactive=True, info="Language of the video") |
|
target_languaje = gr.Dropdown(visible=visible, label="Target languaje", show_label=True, value="Español", choices=language_dict, scale=1, interactive=True, info="Language to translate the subtitles") |
|
number_of_speakers = gr.Dropdown(visible=visible, label="Number of speakers", show_label=True, value=10, choices=num_speaker, scale=1, interactive=True, info="Number of speakers in the video, if you don't know, select 10") |
|
with gr.Row(): |
|
subtify_button = gr.Button(size="lg", value="subtify", min_width="10px", scale=0, visible=visible) |
|
|
|
auxiliar_block2 = gr.Textbox(placeholder="Waiting", label="Auxiliar block 2", elem_id="auxiliar_block2", interactive=False, visible=visible) |
|
with gr.Row(): |
|
video_donwloaded_progress_info = gr.Textbox(placeholder="Waiting", label="Video downloaded progress info", elem_id="video_donwloaded_progress_info", interactive=False, visible=visible) |
|
video_sliced_progress_info = gr.Textbox(placeholder="Waiting", label="Video sliced progress info", elem_id="video_sliced_progress_info", interactive=False, visible=visible) |
|
video_transcribed_progress_info = gr.Textbox(placeholder="Waiting", label="Video transcribed progress info", elem_id="video_transcribed_progress_info", interactive=False, visible=visible) |
|
transcriptions_concatenated_progress_info = gr.Textbox(placeholder="Waiting", label="Transcriptions concatenated progress info", elem_id="transcriptions_concatenated_progress_info", interactive=False, visible=visible) |
|
video_translated_progress_info = gr.Textbox(placeholder="Waiting", label="Transcription translated progress info", elem_id="transcription_translated_progress_info", interactive=False, visible=visible) |
|
video_subtitled_progress_info = gr.Textbox(placeholder="Waiting", label="Video subtitled progress info", elem_id="video_subtitled_progress_info", interactive=False, visible=visible) |
|
|
|
original_audio_path = gr.Textbox(label="Original audio path", elem_id="original_audio_path", visible=visible) |
|
original_video_path = gr.Textbox(label="Original video path", elem_id="original_video_path", visible=visible) |
|
original_audio_transcribed_path = gr.Textbox(label="Original audio transcribed", elem_id="original_audio_transcribed", visible=visible) |
|
original_audio_translated_path = gr.Textbox(label="Original audio translated", elem_id="original_audio_translated", visible=visible) |
|
subtitled_video = gr.Video(label="Subtitled video", elem_id="subtitled_video", visible=visible, interactive=visible) |
|
|
|
|
|
|
|
delete_button.click( |
|
fn=reset_frontend, |
|
outputs=[ |
|
url_textbox, |
|
image, |
|
source_languaje, |
|
target_languaje, |
|
number_of_speakers, |
|
subtify_button, |
|
auxiliar_block2, |
|
video_donwloaded_progress_info, |
|
video_sliced_progress_info, |
|
video_transcribed_progress_info, |
|
transcriptions_concatenated_progress_info, |
|
video_translated_progress_info, |
|
video_subtitled_progress_info, |
|
subtitled_video, |
|
] |
|
) |
|
url_textbox.change( |
|
fn=show_auxiliar_block1, |
|
outputs=[auxiliar_block1] |
|
) |
|
auxiliar_block1.change( |
|
fn=is_valid_url, |
|
inputs=url_textbox, |
|
outputs=[image, source_languaje, target_languaje, number_of_speakers, subtify_button] |
|
) |
|
subtify_button.click( |
|
fn=change_visibility_texboxes, |
|
outputs=[auxiliar_block2, video_donwloaded_progress_info, video_sliced_progress_info, video_transcribed_progress_info, transcriptions_concatenated_progress_info, video_translated_progress_info, video_subtitled_progress_info, auxiliar_block1] |
|
) |
|
auxiliar_block2.change( |
|
fn=get_audio_and_video_from_video, |
|
inputs=[url_textbox], |
|
outputs=[video_donwloaded_progress_info, original_audio_path, original_video_path] |
|
) |
|
video_donwloaded_progress_info.change( |
|
fn=slice_audio, |
|
inputs=[original_audio_path], |
|
outputs=[video_sliced_progress_info] |
|
) |
|
video_sliced_progress_info.change( |
|
fn=trascribe_audio, |
|
inputs=[source_languaje], |
|
outputs=[video_transcribed_progress_info] |
|
) |
|
video_transcribed_progress_info.change( |
|
fn=concatenate_transcriptions, |
|
outputs=[transcriptions_concatenated_progress_info, original_audio_transcribed_path] |
|
) |
|
transcriptions_concatenated_progress_info.change( |
|
fn=translate_transcription, |
|
inputs=[original_audio_transcribed_path, source_languaje, target_languaje], |
|
outputs=[video_translated_progress_info, original_audio_translated_path] |
|
) |
|
video_translated_progress_info.change( |
|
fn=add_translated_subtitles_to_video, |
|
inputs=[original_video_path, original_audio_path, original_audio_translated_path], |
|
outputs=[video_subtitled_progress_info, subtitled_video] |
|
) |
|
|
|
gr.Markdown(html_buy_me_a_coffe) |
|
|
|
demo.launch() |
|
|
|
|
|
if __name__ == "__main__": |
|
parser = argparse.ArgumentParser() |
|
parser.add_argument("--no_ui", action="store_true") |
|
parser.add_argument("--remove_all_files", action="store_true") |
|
args = parser.parse_args() |
|
|
|
if args.no_ui: |
|
subtify_no_ui() |
|
elif args.remove_all_files: |
|
remove_all_files() |
|
else: |
|
subtify() |