Spaces:

ardha27
/

Youtube-AI-Summarizer

Running

App Files Community

Zeph27 committed on Aug 16, 2024

Commit

b72617b

1 Parent(s): 40a56d1

update processing time

Browse files

Files changed (1) hide show

app.py +8 -7

app.py CHANGED Viewed

@@ -67,6 +67,7 @@ def summarize_transcription(transcription, model, gemini_prompt):
 @spaces.GPU(duration=120)
 def process_audio(audio_file, language, whisper_model):
     print("Starting transcription...")
     if device == 0:
         pipe = load_pipeline(whisper_model)
@@ -85,10 +86,12 @@ def process_audio(audio_file, language, whisper_model):
     else:
         print("No language defined, using default language")
         transcription = pipe(inputs, batch_size=8, generate_kwargs={"task": "transcribe"}, return_timestamps=True)["text"]
-    return transcription
 def transcribe(youtube_url, audio_file, whisper_model, gemini_api_key, gemini_prompt, gemini_model_variant, language, progress=gr.Progress()):
-    start_time = time.time()
     try:
         progress(0, desc="Initializing")
         if not gemini_api_key:
@@ -112,7 +115,7 @@ def transcribe(youtube_url, audio_file, whisper_model, gemini_api_key, gemini_pr
             print(f"Audio file read: {audio_file}")
         progress(0.4, desc="Starting transcription")
-        transcription = process_audio(audio_file, language, whisper_model)
         progress(0.6, desc="Cleaning up")
         # Delete the audio file after transcription
@@ -142,9 +145,7 @@ def transcribe(youtube_url, audio_file, whisper_model, gemini_api_key, gemini_pr
         progress(1, desc="Complete")
         print("Transcription and summarization complete.")
-        end_time = time.time()
-        total_time = round(end_time - start_time, 2)
-        return transcription_message, summary_message, transcription_file, summary_file, total_time
     except gr.Error as e:
         # Re-raise Gradio errors
         raise e
@@ -187,7 +188,7 @@ with gr.Blocks(theme='NoCrypt/miku') as demo:
             summary_output = gr.Textbox(label="Summary Output")
         transcription_file = gr.File(label="Download Transcription")
         summary_file = gr.File(label="Download Summary")
-        processing_time = gr.Textbox(label="Total Processing Time (seconds)")
     input_type.change(fn=toggle_input, inputs=input_type, outputs=[youtube_url, audio_file])
     define_language.change(fn=toggle_language, inputs=define_language, outputs=[language])

 @spaces.GPU(duration=120)
 def process_audio(audio_file, language, whisper_model):
     print("Starting transcription...")
+    start_time = time.time()
     if device == 0:
         pipe = load_pipeline(whisper_model)
     else:
         print("No language defined, using default language")
         transcription = pipe(inputs, batch_size=8, generate_kwargs={"task": "transcribe"}, return_timestamps=True)["text"]
+    end_time = time.time()
+    processing_time = round(end_time - start_time, 2)
+    return transcription, processing_time
 def transcribe(youtube_url, audio_file, whisper_model, gemini_api_key, gemini_prompt, gemini_model_variant, language, progress=gr.Progress()):
     try:
         progress(0, desc="Initializing")
         if not gemini_api_key:
             print(f"Audio file read: {audio_file}")
         progress(0.4, desc="Starting transcription")
+        transcription, processing_time = process_audio(audio_file, language, whisper_model)
         progress(0.6, desc="Cleaning up")
         # Delete the audio file after transcription
         progress(1, desc="Complete")
         print("Transcription and summarization complete.")
+        return transcription_message, summary_message, transcription_file, summary_file, processing_time
     except gr.Error as e:
         # Re-raise Gradio errors
         raise e
             summary_output = gr.Textbox(label="Summary Output")
         transcription_file = gr.File(label="Download Transcription")
         summary_file = gr.File(label="Download Summary")
+        processing_time = gr.Textbox(label="Transcription Processing Time (seconds)")
     input_type.change(fn=toggle_input, inputs=input_type, outputs=[youtube_url, audio_file])
     define_language.change(fn=toggle_language, inputs=define_language, outputs=[language])