clone

Build error

App Files Files Community

poemsforaphrodite committed on Aug 28, 2024

Commit

88f7073

verified ·

1 Parent(s): 390fe1a

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -26

app.py CHANGED Viewed

@@ -1,4 +1,4 @@
-import streamlit as st
 import torch
 from TTS.api import TTS
 import os
@@ -9,7 +9,6 @@ os.environ["COQUI_TOS_AGREED"] = "1"
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Initialize TTS model
-@st.cache_resource
 def load_tts_model():
     return TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
@@ -32,30 +31,30 @@ def clone(text, audio_file, language, speaking_rate, pitch, volume,
     return temp_audio_path
-st.title('Advanced Voice Clone')
-st.write('Customize your voice cloning experience with various parameters.')
-text = st.text_area('Text')
-audio_file = st.file_uploader('Voice reference audio file', type=['wav', 'mp3'])
-language = st.selectbox('Language', ["en", "es", "fr", "de", "it"], index=0)
-speaking_rate = st.slider('Speaking Rate', 0.5, 2.0, 1.0)
-pitch = st.slider('Pitch Adjustment', -10, 10, 0)
-volume = st.slider('Volume', 0.1, 2.0, 1.0)
-emotion = st.selectbox('Emotion', ["neutral", "happy", "sad", "angry"], index=0)
-sample_rate = st.selectbox('Sample Rate', [22050, 24000, 44100, 48000], index=1)
-temperature = st.slider('Temperature', 0.1, 1.0, 0.8)
-seed = st.number_input('Seed (optional)', value=None)
-if st.button('Generate'):
-    if text and audio_file:
-        with st.spinner('Generating audio...'):
-            output_path = clone(text, audio_file, language, speaking_rate, pitch, volume,
-                                emotion, sample_rate, temperature, seed)
-            st.audio(output_path)
-    else:
-        st.warning('Please provide both text and a voice reference audio file.')
-# Clean up temporary files
 for file in os.listdir():
     if file.endswith('.wav') and file.startswith('tmp'):
         os.remove(file)

+import gradio as gr
 import torch
 from TTS.api import TTS
 import os
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Initialize TTS model
 def load_tts_model():
     return TTS("tts_models/multilingual/multi-dataset/xtts_v2").to(device)
     return temp_audio_path
+# Define Gradio interface
+iface = gr.Interface(
+    fn=clone,
+    inputs=[
+        gr.Textbox(label="Text"),
+        gr.Audio(label="Voice reference audio file", type="filepath"),
+        gr.Dropdown(["en", "es", "fr", "de", "it"], label="Language", value="en"),
+        gr.Slider(0.5, 2.0, value=1.0, label="Speaking Rate"),
+        gr.Slider(-10, 10, value=0, label="Pitch Adjustment"),
+        gr.Slider(0.1, 2.0, value=1.0, label="Volume"),
+        gr.Dropdown(["neutral", "happy", "sad", "angry"], label="Emotion", value="neutral"),
+        gr.Dropdown([22050, 24000, 44100, 48000], label="Sample Rate", value=24000),
+        gr.Slider(0.1, 1.0, value=0.8, label="Temperature"),
+        gr.Number(label="Seed (optional)")
+    ],
+    outputs=gr.Audio(label="Generated Audio"),
+    title="Advanced Voice Clone",
+    description="Customize your voice cloning experience with various parameters."
+)
+# Launch the interface
+iface.launch()
+# Clean up temporary files (this will run after the Gradio server is closed)
 for file in os.listdir():
     if file.endswith('.wav') and file.startswith('tmp'):
         os.remove(file)