Spaces:

lingy
/

my-asr

Sleeping

App Files Community

Ubuntu committed on Oct 1

Commit

0566ea1

•

1 Parent(s): 75f8860

add whisper v3 support

Browse files

Files changed (1) hide show

app.py +11 -3

app.py CHANGED Viewed

@@ -69,7 +69,7 @@ def download_youtube_audio(youtube_url: str, output_dir: Optional[str] = None) -
         print("Error:", response.status_code, response.text)
         return None  # Return None on failure
-def run_asr(audio_file, youtube_url, with_timestamp):
     temp_file = None
     try:
         if youtube_url:
@@ -80,7 +80,14 @@ def run_asr(audio_file, youtube_url, with_timestamp):
             return "Please provide either an audio file or a YouTube URL."
         files = {'file': open(audio_file, 'rb')}
-        data = {'language': 'en', 'model_name': 'whisper-large-v2-imda', 'with_timestamp': with_timestamp}
         response = requests.post(f"{API_URL}/asr", data=data, files=files)
         if response.status_code == 200:
@@ -120,6 +127,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             youtube_input = gr.Textbox(label="YouTube URL", placeholder="Or paste a YouTube URL here...")
             video_player = gr.HTML(visible=False)
             timestamp_toggle = gr.Checkbox(label="Include Timestamps", value=False)
         with gr.Column(scale=3):
             result = gr.Textbox(
                 label="Transcription Result",
@@ -128,7 +136,7 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
             )
     run_button = gr.Button("🚀 Transcribe Audio", variant="primary")
-    run_button.click(run_asr, inputs=[audio_input, youtube_input, timestamp_toggle], outputs=[result])
     # Update video player and clear transcription and audio input when YouTube URL is entered
     youtube_input.change(

         print("Error:", response.status_code, response.text)
         return None  # Return None on failure
+def run_asr(audio_file, youtube_url, with_timestamp, model_choice):
     temp_file = None
     try:
         if youtube_url:
             return "Please provide either an audio file or a YouTube URL."
         files = {'file': open(audio_file, 'rb')}
+        # Update model_name based on the user's choice
+        if model_choice == "whisper_v3":
+            model_name = "official_v3"
+        else:
+            model_name = "whisper-large-v2-imda"
+        data = {'language': 'en', 'model_name': model_name, 'with_timestamp': with_timestamp}
         response = requests.post(f"{API_URL}/asr", data=data, files=files)
         if response.status_code == 200:
             youtube_input = gr.Textbox(label="YouTube URL", placeholder="Or paste a YouTube URL here...")
             video_player = gr.HTML(visible=False)
             timestamp_toggle = gr.Checkbox(label="Include Timestamps", value=False)
+            model_choice = gr.Radio(["local_whisper", "whisper_v3"], label="Model Selection", value="local_whisper")
         with gr.Column(scale=3):
             result = gr.Textbox(
                 label="Transcription Result",
             )
     run_button = gr.Button("🚀 Transcribe Audio", variant="primary")
+    run_button.click(run_asr, inputs=[audio_input, youtube_input, timestamp_toggle, model_choice], outputs=[result])
     # Update video player and clear transcription and audio input when YouTube URL is entered
     youtube_input.change(