Spaces:

juanpy
/

videoresumen

Runtime error

App Files Files Community

juan-op committed on Jan 7, 2023

Commit

29eb72e

1 Parent(s): 9bd8643

App initializer

Browse files

Files changed (2) hide show

app.py +64 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,64 @@

+from tempfile import TemporaryDirectory
+from pytube import YouTube
+import whisper
+from transformers import pipeline
+import gradio as gr
+def get_title(url: str) -> str:
+    """Returns the title of the YouTube video at the given URL."""
+    yt = YouTube(url)
+    return f"**{yt.title}**"
+def download_audio(url: str, path: str) -> None:
+    """Downloads the audio from the YouTube video at the given URL and saves it to the specified path."""
+    yt = YouTube(url)
+    audio = yt.streams.filter(only_audio=True).first()
+    audio.download(output_path=path, filename="a.mp4")
+def transcribe(path: str) -> list[str]:
+    """Transcribes the audio file at the given path and returns the text."""
+    model = whisper.load_model("base")
+    transcription = model.transcribe(path)["text"]
+    transcription_chunks = [transcription[i : i + 1000] for i in range(0, len(transcription), 1000)]
+    return transcription_chunks
+def summarize(transcription: list[str]) -> str:
+    """Summarizes the given text and returns the summary."""
+    model = pipeline("summarization")
+    summary_chunks = model(transcription, max_length=80, min_length=30)
+    summary = (" ".join([chunks["summary_text"] for chunks in summary_chunks]).strip().replace(" . ", ". "))
+    return summary
+def execute_pipeline(url: str) -> str:
+    """Generates a temporary directory and executes the pipeline to download, transcribe and summarize the video."""
+    with TemporaryDirectory(dir=".") as tmp_dir:
+        download_audio(url, tmp_dir)
+        result = transcribe(f"{tmp_dir}/a.mp4")
+        text = summarize(result)
+        print("Done!")
+        return text
+def main() -> None:
+    """Generates the Gradio interface."""
+    with gr.Blocks(analytics_enabled=True, title="Resume un video") as page:
+        gr.HTML('<h2 style="text-align:center"><span style="font-size:36px">Resume un video de <strong>Youtube</strong></span></h2>')
+        url = gr.Textbox(label="Introduce el link del video:")
+        title = gr.Markdown()
+        output = gr.Textbox(label="Resumen")
+        summarize_btn = gr.Button("Dale").style(full_width=False)
+        summarize_btn.click(fn=execute_pipeline, inputs=url, outputs=output)
+        summarize_btn.click(fn=get_title, inputs=url, outputs=title)
+        gr.Markdown("*Funciona mejor con vídeos en inglés y de menos de 10 minutos.*")
+    page.launch()
+# Start the Gradio app only when this file is executed as a script.
+if __name__ == "__main__":
+    main()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+gradio==3.16.0
+pytube==12.1.2
+transformers==4.25.1
+whisper @ git+https://github.com/openai/whisper.git@28769fcfe50755a817ab922a7bc83483159600a9