rvc-models

Build error

App Files Community

Nick1 committed on Jan 20

Commit

c156672

verified ·

1 Parent(s): 819b637

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -3

app.py CHANGED Viewed

@@ -91,12 +91,12 @@ def create_vc_fn(model_name, tgt_sr, net_g, vc, if_f0, version, file_index):
                     return "You need to upload an audio", None
                 sampling_rate, audio = vc_upload
                 duration = audio.shape[0] / sampling_rate
-                if duration > 90 and spaces:
                     return "Please upload an audio file that is less than 90 seconds. If you need to generate a longer audio file, please use Colab.", None
                 audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
                 if len(audio.shape) > 1:
                     audio = librosa.to_mono(audio.transpose(1, 0))
-                if sampling_rate != 1600000:
                     audio = librosa.resample(audio, orig_sr=sampling_rate, target_sr=16000)
             elif vc_audio_mode == "TTS Audio":
                 if len(tts_text) > 100 and spaces:
@@ -106,7 +106,7 @@ def create_vc_fn(model_name, tgt_sr, net_g, vc, if_f0, version, file_index):
                 os.makedirs("output", exist_ok=True)
                 os.makedirs(os.path.join("output", "tts"), exist_ok=True)
                 asyncio.run(edge_tts.Communicate(tts_text, "-".join(tts_voice.split('-')[:-1])).save(os.path.join("output", "tts", "tts.mp3")))
-                audio, sr = librosa.load(os.path.join("output", "tts", "tts.mp3"), sr=1600000, mono=True)
                 vc_input = os.path.join("output", "tts", "tts.mp3")
             times = [0, 0, 0]
             f0_up_key = int(f0_up_key)

                     return "You need to upload an audio", None
                 sampling_rate, audio = vc_upload
                 duration = audio.shape[0] / sampling_rate
+                if duration > 900 and spaces:
                     return "Please upload an audio file that is less than 90 seconds. If you need to generate a longer audio file, please use Colab.", None
                 audio = (audio / np.iinfo(audio.dtype).max).astype(np.float32)
                 if len(audio.shape) > 1:
                     audio = librosa.to_mono(audio.transpose(1, 0))
+                if sampling_rate != 16000:
                     audio = librosa.resample(audio, orig_sr=sampling_rate, target_sr=16000)
             elif vc_audio_mode == "TTS Audio":
                 if len(tts_text) > 100 and spaces:
                 os.makedirs("output", exist_ok=True)
                 os.makedirs(os.path.join("output", "tts"), exist_ok=True)
                 asyncio.run(edge_tts.Communicate(tts_text, "-".join(tts_voice.split('-')[:-1])).save(os.path.join("output", "tts", "tts.mp3")))
+                audio, sr = librosa.load(os.path.join("output", "tts", "tts.mp3"), sr=16000, mono=True)
                 vc_input = os.path.join("output", "tts", "tts.mp3")
             times = [0, 0, 0]
             f0_up_key = int(f0_up_key)