Spaces:

innnky
/

soft-vits-singingvc

Runtime error

rcell committed on Sep 13, 2022

Commit

99185bb

•

1 Parent(s): f5d0e3c

fix

Files changed (1) hide show

app.py CHANGED Viewed

@@ -9,7 +9,7 @@ numba_logger.setLevel(logging.WARNING)
 import librosa
 import torch
-import torchcrepe
 import commons
 import utils
 from models import SynthesizerTrn
@@ -19,14 +19,15 @@ def resize2d(source, target_len):
     source[source<0.001] = np.nan
     target = np.interp(np.arange(0, len(source)*target_len, len(source))/ target_len, np.arange(0, len(source)), source)
     return np.nan_to_num(target)
 def convert_wav_22050_to_f0(audio):
-    tmp = torchcrepe.predict(audio=audio, fmin=50, fmax=550,
-                             sample_rate=22050, model='full',
-                             batch_size=2048).numpy()[0]
     f0 = np.zeros_like(tmp)
-    f0[tmp > 0] = tmp[tmp > 0]
     return f0
 def get_text(text, hps):
     text_norm = text_to_sequence(text, hps.data.text_cleaners)
     if hps.data.add_blank:

 import librosa
 import torch
 import commons
 import utils
 from models import SynthesizerTrn
     source[source<0.001] = np.nan
     target = np.interp(np.arange(0, len(source)*target_len, len(source))/ target_len, np.arange(0, len(source)), source)
     return np.nan_to_num(target)
 def convert_wav_22050_to_f0(audio):
+    tmp = librosa.pyin(audio,
+                fmin=librosa.note_to_hz('C0'),
+                fmax=librosa.note_to_hz('C7'),
+                frame_length=1780)[0]
     f0 = np.zeros_like(tmp)
+    f0[tmp>0] = tmp[tmp>0]
     return f0
 def get_text(text, hps):
     text_norm = text_to_sequence(text, hps.data.text_cleaners)
     if hps.data.add_blank: