frogcho123 commited on
Commit
d195d40
1 Parent(s): cc4c3a2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +16 -6
app.py CHANGED
@@ -3,6 +3,7 @@ import os
3
  import whisper
4
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
5
  from gtts import gTTS
 
6
 
7
  # Load models
8
  model_stt = whisper.load_model("base")
@@ -36,13 +37,22 @@ def speech_to_speech(input_audio, to_lang):
36
  output_file = "output_audio.mp3"
37
  tts.save(output_file)
38
 
39
- return output_file
 
 
 
40
 
41
  languages = ["ru", "fr", "es", "de"] # Example languages: Russian, French, Spanish, German
42
- file_input = gr.inputs.File(label="Upload Audio")
43
  dropdown = gr.inputs.Dropdown(languages, label="Translation Language")
44
- audio_output = gr.outputs.Audio(label="Translated Voice")
45
-
46
-
47
- gr.Interface(fn=speech_to_speech, inputs=[file_input, dropdown], outputs=audio_output, title="Speech-to-Speech Translator", description="Upload an audio file (MP3, WAV, or FLAC) and choose the target language for translation.", theme="default").launch()
 
 
 
 
 
 
48
 
 
3
  import whisper
4
  from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
5
  from gtts import gTTS
6
+ import numpy as np
7
 
8
  # Load models
9
  model_stt = whisper.load_model("base")
 
37
  output_file = "output_audio.mp3"
38
  tts.save(output_file)
39
 
40
+ # Load output audio as numpy array
41
+ audio_np = np.array(output_file)
42
+
43
+ return audio_np
44
 
45
  languages = ["ru", "fr", "es", "de"] # Example languages: Russian, French, Spanish, German
46
+ file_input = gr.inputs.File(label="Upload Audio", accept="audio/*")
47
  dropdown = gr.inputs.Dropdown(languages, label="Translation Language")
48
+ audio_output = gr.outputs.Audio(label="Translated Voice", type="numpy")
49
+
50
+ gr.Interface(
51
+ fn=speech_to_speech,
52
+ inputs=[file_input, dropdown],
53
+ outputs=audio_output,
54
+ title="Speech-to-Speech Translator",
55
+ description="Upload an audio file (MP3, WAV, or FLAC) and choose the target language for translation.",
56
+ theme="default"
57
+ ).launch()
58