Voice-Cloning-for-YouTube

Runtime error

App Files Community

kevinwang676 committed on Oct 2, 2023

Commit

bc01a52

1 Parent(s): c48b863

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -66

app.py CHANGED Viewed

@@ -208,79 +208,27 @@ def predict_song_from_yt(
 description = f"""
-## <center>🏞️ - 滔滔AI，为您提供全场景的AI声音服务（如AI拟声、AI歌手、AI变声等）</center>
-### <center>🌟 - 滔滔AI合作音乐人：[一清清清](https://space.bilibili.com/22960772?spm_id_from=333.337.0.0)；AI歌手，唱我想唱！</center>
-### <center>🎡 - 更多精彩，尽在[滔滔AI](http://www.talktalkai.com)；合作：talktalkai.kevin@gmail.com</center>
-<center>💡 - 如何使用此程序：在页面上方选择“从B站视频上传”模块，填写视频网址和视频起止时间后，点击“submit”按键即可！您还可以点击页面最下方的示例快速预览效果</center>
-<h1 align="center"><a href="http://www.talktalkai.com"><img src="https://y.qq.com/music/photo_new/T001R300x300M0000025Gr0r2OXvrn_2.jpg", alt="talktalkai" border="0" style="margin: 0 auto; height: 200px;" /></a> </h1>
-""".strip()
-article = """
-<p style='text-align: center'> 注意❗：请不要生成会对个人以及组织造成侵害的内容，此程序仅供科研、学习及个人娱乐使用。
-</p>
-<p style='text-align: center'> 🌊🎶🏞️ - 江水东流急，滔滔无尽声。 明·顾璘
-</p>
 """.strip()
-interface_mic = gr.Interface(
-    predict,
-    inputs=[
-        gr.Dropdown(speakers, value=speakers[0], label="🎤AI歌手🎶 - 🌟一清清清🌟"),
-        gr.Audio(type="filepath", source="microphone", label="请用麦克风上传您想转换的歌曲"),
-        gr.Slider(-12, 12, value=0, step=1, label="变调 (默认为0；有正负值，+2为升高两个key)"),
-        gr.Checkbox(False, label="是否开启自动f0预测", info="勾选即为开启；配合聚类模型f0预测效果更好，仅限语音转换时使用", visible=False),
-        gr.Slider(0.0, 1.0, value=default_cluster_infer_ratio, step=0.1, label="聚类模型混合比例", info="0-1之间，0即不启用聚类。使用聚类模型能提升音色相似度，但会导致咬字下降 (如果使用，建议0.5左右)"),
-        gr.Slider(0.0, 1.0, value=0.4, step=0.1, label="noise scale (建议保持不变)", visible=False),
-        gr.Dropdown(
-            choices=["crepe", "crepe-tiny", "parselmouth", "dio", "harvest"],
-            value=default_f0_method,
-            label="模型推理方法 (crepe推理效果最好)", visible=False
-        ),
-    ],
-    outputs="audio",
-    title="🌊💕🎶 - 滔滔AI+音乐：可从B站直接上传素材，无需分离背景音",
-    description=description,
-    article=article,
-)
-interface_file = gr.Interface(
-    predict,
-    inputs=[
-        gr.Dropdown(speakers, value=speakers[0], label="🎤AI歌手🎶 - 🌟一清清清🌟"),
-        gr.Audio(type="filepath", source="upload", label="请上传您想转换的歌曲 (仅人声部分)"),
-        gr.Slider(-12, 12, value=0, step=1, label="变调 (默认为0；有正负值，+2为升高两个key)"),
-        gr.Checkbox(False, label="是否开启自动f0预测", info="勾选即为开启；配合聚类模型f0预测效果更好，仅限语音转换时使用", visible=False),
-        gr.Slider(0.0, 1.0, value=default_cluster_infer_ratio, step=0.1, label="聚类模型混合比例", info="0-1之间，0即不启用聚类。使用聚类模型能提升音色相似度，但会导致咬字下降 (如果使用，建议0.5左右)"),
-        gr.Slider(0.0, 1.0, value=0.4, step=0.1, label="noise scale (建议保持不变)", visible=False),
-        gr.Dropdown(
-            choices=["crepe", "crepe-tiny", "parselmouth", "dio", "harvest"],
-            value=default_f0_method,
-            label="模型推理方法 (crepe推理效果最好)", visible=False
-        ),
-    ],
-    outputs="audio",
-    title="🌊💕🎶 - 滔滔AI+音乐：可从B站直接上传素材，无需分离背景音",
-    description=description,
-    article=article,
-)
 interface_yt = gr.Interface(
     predict_song_from_yt,
     inputs=[
         gr.Textbox(
-            label="Bilibili网址", info="请填写含有您喜欢歌曲的Bilibili网址，可直接填写相应的BV号", value="https://www.bilibili.com/video/BV..."
         ),
-        gr.Number(value=0, label="起始时间 (秒)"),
-        gr.Number(value=15, label="结束时间 (秒)"),
-        gr.Dropdown(speakers, value=speakers[0], label="🎤AI歌手🎶 - 🌟一清清清🌟"),
-        gr.Slider(-12, 12, value=0, step=1, label="变调 (默认为0；有正负值，+2为升高两个key)"),
         gr.Checkbox(False, label="是否开启自动f0预测", info="勾选即为开启；配合聚类模型f0预测效果更好，仅限语音转换时使用", visible=False),
-        gr.Slider(0.0, 1.0, value=default_cluster_infer_ratio, step=0.1, label="聚类模型混合比例", info="0-1之间，0即不启用聚类。使用聚类模型能提升音色相似度，但会导致咬字下降"),
         gr.Slider(0.0, 1.0, value=0.4, step=0.1, label="noise scale (建议保持不变)", visible=False),
         gr.Dropdown(
             choices=["crepe", "crepe-tiny", "parselmouth", "dio", "harvest"],
@@ -288,17 +236,17 @@ interface_yt = gr.Interface(
             label="模型推理方法 (crepe推理效果最好)", visible=False
         ),
     ],
-    outputs=[gr.Audio(label="AI歌手+伴奏🎵"), gr.Audio(label="AI歌手人声部分🎤")],
-    title="🌊💕🎶 - 滔滔AI+音乐：可从B站直接上传素材，无需分离背景音",
     description=description,
     article=article,
     examples=[
-        ["https://www.bilibili.com/video/BV1ip4y1p7Pn", 87, 103, speakers[0], 0, False, default_cluster_infer_ratio, 0.4, default_f0_method],
     ],
 )
 interface = gr.TabbedInterface(
-    [interface_yt, interface_mic, interface_file],
-    ["📺 - 从B站视频上传 ⭐推荐⭐", "🎙️ - 从麦克风上传", "🎵 - 从文件上传"],
 )

 description = f"""
+## <center>🏞️ - TalkTalkAI - Generative AI Text to Speech & Singing Voice Cloning</center>
+### <center>🌟 - The singer who collaborates with TalkTalkAI[一清清清](https://space.bilibili.com/22960772?spm_id_from=333.337.0.0)</center>
+### <center>🤗 - Stay tuned. The best is yet to come. Contact us: talktalkai.kevin@gmail.com</center>
 """.strip()
 interface_yt = gr.Interface(
     predict_song_from_yt,
     inputs=[
         gr.Textbox(
+            label="YouTube URL or ID", info="A YouTube URL (or ID) to a song on YouTube you want to clone from"
         ),
+        gr.Number(value=0, label="Start Time (seconds)"),
+        gr.Number(value=15, label="End Time (seconds)"),
+        gr.Dropdown(speakers, value=speakers[0], label="🎤 AI Singer"),
+        gr.Slider(-12, 12, value=0, step=1, label="Transpose (Semitones)"),
         gr.Checkbox(False, label="是否开启自动f0预测", info="勾选即为开启；配合聚类模型f0预测效果更好，仅限语音转换时使用", visible=False),
+        gr.Slider(0.0, 1.0, value=default_cluster_infer_ratio, step=0.1, label="聚类模型混合比例", info="0-1之间，0即不启用聚类。使用聚类模型能提升音色相似度，但会导致咬字下降", visible=False),
         gr.Slider(0.0, 1.0, value=0.4, step=0.1, label="noise scale (建议保持不变)", visible=False),
         gr.Dropdown(
             choices=["crepe", "crepe-tiny", "parselmouth", "dio", "harvest"],
             label="模型推理方法 (crepe推理效果最好)", visible=False
         ),
     ],
+    outputs=[gr.Audio(label="With BGM🎵"), gr.Audio(label="Without BGM🎤")],
+    title="🌊💕🎶 - TalkTalkAI",
     description=description,
     article=article,
     examples=[
+        ["https://www.youtube.com/watch?v=cn4M-fH08XY", 0, 11, speakers[0], 0, False, default_cluster_infer_ratio, 0.4, default_f0_method],
     ],
 )
 interface = gr.TabbedInterface(
+    [interface_yt],
+    ["📺 - Clone Song From YouTube"],
 )