Update app.py
Browse files
app.py
CHANGED
@@ -45,20 +45,21 @@ css="""
|
|
45 |
title="""
|
46 |
<div style="text-align: center;">
|
47 |
<h1>Voice Cloning for Bark Text-to-Audio</h1>
|
48 |
-
<p>This demo is an adaptation of the <a href="https://github.com/serp-ai/bark-with-voice-clone" target="_blank">Serp-AI</a
|
|
|
49 |
</div>
|
50 |
"""
|
51 |
|
52 |
with gr.Blocks(css=css) as demo:
|
53 |
with gr.Column(elem_id="col-container"):
|
54 |
gr.HTML(title)
|
55 |
-
audio_in = gr.Audio(label="Voice in to clone",
|
56 |
-
transcript = gr.Textbox(label="Manual transcription of your audio")
|
57 |
name = gr.Textbox(label="Name your voice")
|
58 |
|
59 |
generate_btn = gr.Button("Clone voice !")
|
60 |
|
61 |
-
npz_file = gr.File(label=".npz file"
|
62 |
|
63 |
generate_btn.click(clone_voice, inputs=[audio_in, name, transcript], outputs=[npz_file])
|
64 |
|
|
|
45 |
title="""
|
46 |
<div style="text-align: center;">
|
47 |
<h1>Voice Cloning for Bark Text-to-Audio</h1>
|
48 |
+
<p>This demo is an adaptation of the <a href="https://github.com/serp-ai/bark-with-voice-clone" target="_blank">Serp-AI</a> attempts to enable voice cloning using Bark</p>
|
49 |
+
<p>If you want to generate audio from text with this npz file, follow the generate.ipynb notebook you will find at the Serp-AI Bark clone repo.</p>
|
50 |
</div>
|
51 |
"""
|
52 |
|
53 |
with gr.Blocks(css=css) as demo:
|
54 |
with gr.Column(elem_id="col-container"):
|
55 |
gr.HTML(title)
|
56 |
+
audio_in = gr.Audio(label="Voice in to clone", source="microphone", type="filepath")
|
57 |
+
transcript = gr.Textbox(label="Manual transcription of your audio", info="the audio you want to clone (will get truncated so 5-10 seconds is probably fine, existing samples that I checked are around 7 seconds), then you'll need to manually transcribe your audio below:")
|
58 |
name = gr.Textbox(label="Name your voice")
|
59 |
|
60 |
generate_btn = gr.Button("Clone voice !")
|
61 |
|
62 |
+
npz_file = gr.File(label=".npz file")
|
63 |
|
64 |
generate_btn.click(clone_voice, inputs=[audio_in, name, transcript], outputs=[npz_file])
|
65 |
|