Spaces:
Sleeping
Sleeping
import streamlit as st | |
from streamlit_lottie import st_lottie | |
from utils import write_vtt, write_srt | |
from flores200_codes import flores_codes | |
import ffmpeg | |
import requests | |
from typing import Iterator | |
from io import StringIO | |
import numpy as np | |
import pathlib | |
import os | |
st.set_page_config(page_title="Captions", page_icon=":movie_camera:", layout="wide") | |
# Sema Translator | |
Public_Url = 'https://lewiskimaru-helloworld.hf.space' #endpoint | |
# Define a function that we can use to load lottie files from a link. | |
def load_lottieurl(url: str): | |
r = requests.get(url) | |
if r.status_code != 200: | |
return None | |
return r.json() | |
APP_DIR = pathlib.Path(__file__).parent.absolute() | |
LOCAL_DIR = APP_DIR / "local_transcript" | |
LOCAL_DIR.mkdir(exist_ok=True) | |
save_dir = LOCAL_DIR / "output" | |
save_dir.mkdir(exist_ok=True) | |
col1, col2 = st.columns([1, 3]) | |
with col1: | |
lottie = load_lottieurl("https://assets6.lottiefiles.com/packages/lf20_cjnxwrkt.json") | |
st_lottie(lottie) | |
with col2: | |
st.write(""" | |
## Sema Captions | |
##### β Upload a video file and a transcript as .srt or .vtt file and get a video with subtitles.""") | |
def getSubs(segments: Iterator[dict], format: str, maxLineWidth: int) -> str: | |
segmentStream = StringIO() | |
if format == 'vtt': | |
write_vtt(segments, file=segmentStream, maxLineWidth=maxLineWidth) | |
elif format == 'srt': | |
write_srt(segments, file=segmentStream, maxLineWidth=maxLineWidth) | |
else: | |
raise Exception("Unknown format " + format) | |
segmentStream.seek(0) | |
return segmentStream.read() | |
def split_video_audio(uploaded_file): | |
with open(f"{save_dir}/input.mp4", "wb") as f: | |
f.write(uploaded_file.read()) | |
audio = ffmpeg.input(f"{save_dir}/input.mp4") | |
audio = ffmpeg.output(audio, f"{save_dir}/output.wav", acodec="pcm_s16le", ac=1, ar="16k") | |
ffmpeg.run(audio, overwrite_output=True) | |
def translate(userinput, target_lang, source_lang=None): | |
if source_lang: | |
url = f"{Public_Url}/translate_enter/" | |
data = { | |
"userinput": userinput, | |
"source_lang": source_lang, | |
"target_lang": target_lang, | |
} | |
response = requests.post(url, json=data) | |
result = response.json() | |
print(type(result)) | |
source_lange = source_lang | |
translation = result['translated_text'] | |
else: | |
url = f"{Public_Url}/translate_detect/" | |
data = { | |
"userinput": userinput, | |
"target_lang": target_lang, | |
} | |
response = requests.post(url, json=data) | |
result = response.json() | |
source_lange = result['source_language'] | |
translation = result['translated_text'] | |
return source_lange, translation | |
def main(): | |
uploaded_video = st.file_uploader("Upload Video File", type=["mp4", "avi", "mov", "mkv"]) | |
# get the name of the input_file | |
if uploaded_video is not None: | |
filename = uploaded_video.name[:-4] | |
else: | |
filename = None | |
transcript_file = st.file_uploader("Upload Transcript File", type=["srt", "vtt"]) | |
if transcript_file is not None: | |
transcript_name = transcript_file.name | |
else: | |
transcript_name = None | |
if uploaded_video is not None and transcript_file is not None: | |
if transcript_name[-3:] == "vtt": | |
with open("uploaded_transcript.vtt", "wb") as f: | |
f.writelines(transcript_file) | |
f.close() | |
with open(os.path.join(os.getcwd(), "uploaded_transcript.vtt"), "rb") as f: | |
vtt_file = f.read() | |
if st.button("Generate Video with Subtitles"): | |
with st.spinner("Generating Subtitled Video"): | |
split_video_audio(uploaded_video) | |
video_file = ffmpeg.input(f"{save_dir}/input.mp4") | |
audio_file = ffmpeg.input(f"{save_dir}/output.wav") | |
ffmpeg.concat(video_file.filter("subtitles", "uploaded_transcript.vtt"), audio_file, v=1, a=1).output("final.mp4").global_args('-report').run(quiet=True, overwrite_output=True) | |
video_with_subs = open("final.mp4", "rb") | |
col3, col4 = st.columns(2) | |
with col3: | |
st.video(uploaded_video) | |
with col4: | |
st.video(video_with_subs) | |
st.download_button(label="Download Video with Subtitles", | |
data=video_with_subs, | |
file_name=f"{filename}_with_subs.mp4") | |
elif transcript_name[-3:] == "srt": | |
with open("uploaded_transcript.srt", "wb") as f: | |
f.writelines(transcript_file) | |
f.close() | |
with open(os.path.join(os.getcwd(), "uploaded_transcript.srt"), "rb") as f: | |
srt_file = f.read() | |
if st.button("Generate Video with Subtitles"): | |
with st.spinner("Generating Subtitled Video"): | |
split_video_audio(uploaded_video) | |
video_file = ffmpeg.input(f"{save_dir}/input.mp4") | |
audio_file = ffmpeg.input(f"{save_dir}/output.wav") | |
ffmpeg.concat(video_file.filter("subtitles", "uploaded_transcript.srt"), audio_file, v=1, a=1).output("final.mp4").run(quiet=True, overwrite_output=True) | |
video_with_subs = open("final.mp4", "rb") | |
col3, col4 = st.columns(2) | |
with col3: | |
st.video(uploaded_video) | |
with col4: | |
st.video(video_with_subs) | |
st.download_button(label="Download Video with Subtitles", | |
data=video_with_subs, | |
file_name=f"{filename}_with_subs.mp4") | |
else: | |
st.error("Please upload a .srt or .vtt file") | |
else: | |
st.info("Please upload a video file and a transcript file ") | |
if __name__ == "__main__": | |
main() | |
st.markdown("###### ") | |
st.markdown("###### Powered by [sema Β© 2024](https://www.sema.wiki)") | |