Spaces:

gauravgulati619
/

MediVox

Running

gauravgulati619 committed 15 days ago

Commit

9943a83

1 Parent(s): cc751de

Fix: Update audio handling in Gradio interface

Files changed (2) hide show

.gitignore CHANGED Viewed

@@ -10,7 +10,7 @@ __pycache__/
 *.wav
 *.jpg
 download.jpg
-Temp.mp3
 final.mp3
 patient_voice.mp3

 *.wav
 *.jpg
 download.jpg
+output_audio.mp3
 final.mp3
 patient_voice.mp3

app.py CHANGED Viewed

@@ -130,9 +130,11 @@ def process_inputs(audio_filepath, image_filepath):
     else:
         doctor_response = "No image provided for me to analyze"
-    voice_of_doctor = text_to_speech_with_elevenlabs(input_text=doctor_response, output_filepath="final.mp3")
-    return speech_to_text_output, doctor_response, voice_of_doctor
 # Create the interface
@@ -145,7 +147,7 @@ iface = gr.Interface(
     outputs=[
         gr.Textbox(label="Speech to Text"),
         gr.Textbox(label="Doctor's Response"),
-        gr.Audio("Temp.mp3")
     ],
     title="AI Doctor with Vision and Voice"
 )

     else:
         doctor_response = "No image provided for me to analyze"
+    # Generate audio response and return the filepath
+    output_filepath = "output_audio.mp3"
+    voice_of_doctor = text_to_speech_with_elevenlabs(input_text=doctor_response, output_filepath=output_filepath)
+    return speech_to_text_output, doctor_response, output_filepath
 # Create the interface
     outputs=[
         gr.Textbox(label="Speech to Text"),
         gr.Textbox(label="Doctor's Response"),
+        gr.Audio(label="Doctor's Voice")
     ],
     title="AI Doctor with Vision and Voice"
 )