Spaces:

frogcho123
/

speech2speech

Runtime error

frogcho123 committed on Jun 6, 2023

Commit

b2604a4

•

1 Parent(s): 0053c85

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,7 +4,7 @@ import gradio as gr
 import whisper
 from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 from gtts import gTTS
-from IPython.display import Audio
 # Load the models and tokenizer
 whisper_model = whisper.load_model("base")
@@ -40,7 +40,10 @@ def translate_audio(input_file, to_lang):
     # Load audio data from file
     audio_data = open(temp_output_file, "rb").read()
-    return Audio(audio_data)
 def translate_audio_interface(input_file, to_lang):
     return translate_audio(input_file, to_lang)
@@ -48,7 +51,7 @@ def translate_audio_interface(input_file, to_lang):
 iface = gr.Interface(
     fn=translate_audio_interface,
     inputs=["file", "text"],
-    outputs="audio",
     title="Audio Translation",
     description="Upload an MP3 file and select the target language for translation.",
     examples=[
@@ -57,4 +60,5 @@ iface = gr.Interface(
     ]
 )
-iface.launch(debug = True)

 import whisper
 from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 from gtts import gTTS
+import base64
 # Load the models and tokenizer
 whisper_model = whisper.load_model("base")
     # Load audio data from file
     audio_data = open(temp_output_file, "rb").read()
+    # Convert audio data to Base64 string
+    audio_base64 = base64.b64encode(audio_data).decode("utf-8")
+    return audio_base64
 def translate_audio_interface(input_file, to_lang):
     return translate_audio(input_file, to_lang)
 iface = gr.Interface(
     fn=translate_audio_interface,
     inputs=["file", "text"],
+    outputs="text",
     title="Audio Translation",
     description="Upload an MP3 file and select the target language for translation.",
     examples=[
     ]
 )
+iface.launch()