Spaces:

mazalaai
/

tts

Sleeping

App Files Community

MAZALA2024 committed on Oct 13, 2024

Commit

8d4ed80

verified ·

1 Parent(s): 32fb87d

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -14

app.py CHANGED Viewed

@@ -2,27 +2,29 @@ import gradio as gr
 import base64
 import numpy as np
 from scipy.io import wavfile
-from voice_processing import tts, get_model_names, voice_mapping
 from io import BytesIO
-def convert_tts(model_name, tts_text, selected_voice, slang_rate, use_uploaded_voice, voice_upload):
     edge_tts_voice = voice_mapping.get(selected_voice)
     if not edge_tts_voice:
         return {"error": f"Invalid voice '{selected_voice}'."}, None
     voice_upload_file = None
     if use_uploaded_voice and voice_upload is not None:
-        voice_upload_file = voice_upload.read()
-    # Call the tts processing function
-    result = tts(
         model_name, tts_text, edge_tts_voice, slang_rate, use_uploaded_voice, voice_upload_file
     )
-    if isinstance(result, dict) and "error" in result:
-        return result, None
-    info, _, (tgt_sr, audio_output) = result
     # Process audio output to bytes
     audio_bytes = None
@@ -47,9 +49,9 @@ def get_voices():
 iface = gr.Interface(
     fn=convert_tts,
     inputs=[
-        gr.Dropdown(choices=get_models(), label="Model"),
         gr.Textbox(label="Text", placeholder="Enter text here"),
-        gr.Dropdown(choices=get_voices(), label="Voice"),
         gr.Slider(minimum=0, maximum=1, step=0.01, label="Slang Rate"),
         gr.Checkbox(label="Use Uploaded Voice"),
         gr.File(label="Voice File")
@@ -59,8 +61,7 @@ iface = gr.Interface(
         gr.Textbox(label="Audio URI")
     ],
     title="Text-to-Speech Conversion"
-    # Remove or comment out concurrency parameters not supported in Gradio 4.36.0
 )
 # Launch the interface
-iface.launch(debug=True, show_error=True)

 import base64
 import numpy as np
 from scipy.io import wavfile
+from voice_processing import parallel_tts, get_model_names, voice_mapping
 from io import BytesIO
+import asyncio  # Import asyncio
+# Define an asynchronous function for the Gradio interface
+async def convert_tts(model_name, tts_text, selected_voice, slang_rate, use_uploaded_voice, voice_upload):
     edge_tts_voice = voice_mapping.get(selected_voice)
     if not edge_tts_voice:
         return {"error": f"Invalid voice '{selected_voice}'."}, None
     voice_upload_file = None
     if use_uploaded_voice and voice_upload is not None:
+        with open(voice_upload.name, 'rb') as f:
+            voice_upload_file = f.read()
+    # Create task for parallel processing
+    task = (
         model_name, tts_text, edge_tts_voice, slang_rate, use_uploaded_voice, voice_upload_file
     )
+    # Asynchronous call to your tts processing function using parallel processing
+    result = await asyncio.get_event_loop().run_in_executor(None, parallel_tts, [task])
+    info, _, (tgt_sr, audio_output) = result[0]
     # Process audio output to bytes
     audio_bytes = None
 iface = gr.Interface(
     fn=convert_tts,
     inputs=[
+        gr.Dropdown(choices=get_models(), label="Model", interactive=True),
         gr.Textbox(label="Text", placeholder="Enter text here"),
+        gr.Dropdown(choices=get_voices(), label="Voice", interactive=True),
         gr.Slider(minimum=0, maximum=1, step=0.01, label="Slang Rate"),
         gr.Checkbox(label="Use Uploaded Voice"),
         gr.File(label="Voice File")
         gr.Textbox(label="Audio URI")
     ],
     title="Text-to-Speech Conversion"
 )
 # Launch the interface
+iface.launch(debug=True)  # Set share=True to create a public link