File size: 953 Bytes
194fffd
 
 
 
 
33e0dc8
194fffd
 
 
 
33e0dc8
194fffd
 
 
 
 
 
 
 
 
 
33e0dc8
194fffd
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
import os
import tempfile

import gradio as gr
import torch
from TTS.api import TTS

# Load the XTTS v1 multilingual model once at import time; `predict` reuses
# this single instance for every request. Run on the GPU only when CUDA is
# actually available and fall back to CPU otherwise, rather than requesting a
# GPU unconditionally (which cannot work on a CPU-only host).
tts = TTS(
    "tts_models/multilingual/multi-dataset/xtts_v1",
    gpu=torch.cuda.is_available(),
)

def predict(prompt, language, audio_file_pth):
    """Synthesise *prompt* in the voice of the uploaded speaker sample.

    Args:
        prompt: Text to be spoken.
        language: Language code forwarded to the TTS model (one of the
            dropdown choices, e.g. ``"en"``).
        audio_file_pth: Path to the reference speaker audio file.

    Returns:
        The value produced by ``gr.make_waveform`` for the generated audio,
        which the interface shows in its video output.

    Raises:
        gr.Error: If the prompt, the language, or the speaker audio is
            missing.
    """
    # Fail early with a message the UI can display instead of letting the
    # model raise an opaque error on missing inputs.
    if not prompt or not prompt.strip():
        raise gr.Error("Please enter a prompt to synthesise.")
    if not language:
        raise gr.Error("Please select a language.")
    if not audio_file_pth:
        raise gr.Error("Please upload a speaker WAV file.")

    # Give every request its own output file: a shared, fixed "output.wav"
    # would be overwritten whenever two requests overlap.
    fd, wav_path = tempfile.mkstemp(suffix=".wav")
    os.close(fd)  # only the path is handed on; the descriptor is not needed
    try:
        tts.tts_to_file(
            text=prompt,
            file_path=wav_path,
            speaker_wav=audio_file_pth,
            language=language,
        )
        return gr.make_waveform(audio=wav_path)
    finally:
        # By now the waveform video has been rendered (or synthesis failed),
        # so the intermediate WAV is no longer needed.
        try:
            os.remove(wav_path)
        except OSError:
            # Best-effort cleanup: a leftover temp file must not mask the
            # real result or the real error.
            pass


title = "XTTS: MVP"

# Build the demo UI around `predict` and start serving it right away.
# Inputs are passed to `predict` positionally, in the order listed here:
# prompt text, language code, path of the uploaded speaker sample.
gr.Interface(
    fn=predict,
    inputs=[
        gr.Textbox(
            label="Prompt",
            info="One or two sentences at a time is better* (max: 10)",
            placeholder="It took me quite a long time to develop a voice, and now that I have it I'm not going to be silent.",
        ),
        gr.Dropdown(
            label="Language",
            choices=["en", "es", "fr", "de", "it", "pt", "pl", "tr", "ru", "nl", "cz", "ar", "zh"],
            # Preselect a language so a request never arrives without one.
            # `max_choices` was dropped: it only applies to multiselect
            # dropdowns, and this one is single-select.
            value="en",
        ),
        # type="filepath" makes Gradio hand `predict` a path on disk.
        gr.Audio(label="Upload Speaker WAV", type="filepath"),
    ],
    outputs=[
        gr.Video(label="Synthesised Speech"),
    ],
    title=title,
).launch(debug=True)