Spaces:

deven367
/

yt-video-annotator-hf

Sleeping

File size: 2,644 Bytes

6dae90f
 
 
aadeb1f
 
 
6dae90f
 
 
 
 
 
 
 
 
 
 
 
 
aadeb1f
6dae90f
 
 
 
 
 
 
aadeb1f
 
 
 
6dae90f
 
 
2433253
 
 
 
d1a4980
2433253
 
 
 
 
aadeb1f
2433253
aadeb1f
6dae90f
2433253
 
6dae90f
2433253
 
 
6dae90f
 
 
 
 
2433253
6dae90f
 
 
2433253
6dae90f
2433253
 
 
 
 
 
 
 
6dae90f
2433253
 
 
 
 
 
 
 
 
6dae90f
2433253
6dae90f
aadeb1f
 
 
 
 
 
6dae90f

from pathlib import Path

import numpy as np
import streamlit as st
from fastcore.xtras import globtastic

from annotator.utils import (
    annotate,
    df_from_result,
    find_word_timestamp,
    generate_srt,
    get_audio,
    get_v_from_url,
    working_directory,
    write_srt,
)

# Request Streamlit's "wide" page layout; main() lays the UI out in two
# side-by-side columns.
st.set_page_config(layout="wide")


# Working directories, relative to the current working directory. They are
# created when the module is loaded; exist_ok=True makes that idempotent and
# avoids the check-then-create race of a separate exists() test.
SRT_PATH = Path("srt")  # generated .srt subtitle files are written/read here
SRT_PATH.mkdir(exist_ok=True)

AUDIO_PATH = Path("./audio")  # searched for the video's .wav audio file
AUDIO_PATH.mkdir(exist_ok=True)


def make_sidebar():
    """Fill the Streamlit sidebar with the app title and a repo blurb."""
    sidebar = st.sidebar
    # Object notation on st.sidebar places each element in the sidebar.
    sidebar.markdown("## yt-video-annotator")
    sidebar.write("Link to the GitHub repo")


def caption_from_url(url):
    """Fetch a video's audio, annotate it, and tabulate the annotation.

    Args:
        url: URL of the video to process (main() passes the YouTube URL
            entered by the user).

    Returns:
        A ``(audio_src, df)`` tuple, where ``audio_src`` is the first
        ``*.wav`` entry under ``AUDIO_PATH`` whose name matches the key
        returned by ``get_v_from_url(url)``, and ``df`` is what
        ``df_from_result`` builds from the ``annotate`` output.

    Raises:
        FileNotFoundError: If no matching ``.wav`` file is found under
            ``AUDIO_PATH`` after ``get_audio`` has run.
    """
    # Called for its side effect only; the return value was never used.
    # NOTE(review): presumably this writes the .wav into AUDIO_PATH --
    # confirm against annotator.utils.get_audio.
    get_audio(url)

    video_key = get_v_from_url(url)
    # video_key is passed as a regular expression (file_re) to pick the
    # audio file belonging to this particular video.
    matches = globtastic(AUDIO_PATH, file_glob="*.wav", file_re=video_key)
    if not matches:
        # Fail with a clear message instead of a bare IndexError on [0].
        raise FileNotFoundError(
            f"No .wav file matching {video_key!r} found in {AUDIO_PATH}"
        )
    audio_src = matches[0]

    df = df_from_result(annotate(audio_src))
    return audio_src, df


def _parse_words(raw):
    """Split comma-separated input into stripped, non-empty search words."""
    return [word.strip() for word in raw.split(",") if word.strip()]


def main():
    """Render the app page and react to the user's chosen action.

    The left column shows the URL input and a video preview. The right
    column offers two actions:

    * "Search for words": annotate the video and print, for each word the
      user entered, the values returned by ``find_word_timestamp``.
    * "Generate subtitles for the entire video": annotate the video, write
      an SRT file into ``SRT_PATH`` and offer it as a download.
    """
    # Stem of the generated SRT file; stays None unless "Generate SRT" was
    # clicked during this script run, which gates the download button below.
    name = None
    make_sidebar()
    place = "https://www.youtube.com/watch?v=C0DPdy98e4c&ab_channel=SimonYapp"
    col1, col2 = st.columns([1.2, 1])
    with col1:
        url = st.text_input("Enter URL for the YT video", place)
        st.video(url)

    with col2:
        default_opt = "Search for words"
        opt = st.radio(
            "What do you wish to do?",
            [default_opt, "Generate subtitles for the entire video"],
        )
        if opt == default_opt:
            st.markdown("### Search for words in the video")
            raw_words = st.text_input("Enter words separated by a comma")
            # Strip whitespace and drop empty entries so input such as
            # "foo, bar" or "" does not search for " bar" or "".
            words = _parse_words(raw_words)

            if st.button("Get Timestamps"):
                if not words:
                    st.warning("Enter at least one word to search for.")
                else:
                    _, df = caption_from_url(url)
                    times = find_word_timestamp(df, *words)
                    # One row per searched word.
                    # NOTE(review): assumes find_word_timestamp returns the
                    # same number of values for every word -- confirm.
                    times = np.asarray(times).reshape(len(words), -1)
                    for i, word in enumerate(words):
                        st.write(f"{word} is said on {times[i].flatten()} timestamp")

        else:
            if st.button("Generate SRT"):
                audio_src, df = caption_from_url(url)
                name = Path(audio_src).stem
                s = generate_srt(df)
                with working_directory(SRT_PATH):
                    write_srt(s, name)

        if name is not None:
            with working_directory(SRT_PATH):
                key = get_v_from_url(url)
                # Locate the SRT file whose name matches this video's key.
                srt = globtastic(".", file_glob="*.srt", file_re=key)[0]
                with open(srt) as f:
                    st.download_button("Download SRT", f, file_name=f"{name}.srt")

    # NOTE: nothing here removes the audio/ and srt/ directories, so their
    # contents accumulate across runs.


# Build the page only when this file is executed as a script, not when it is
# imported as a module.
if __name__ == "__main__":
    main()