Spaces:

nakas
/

Time-Domain-Audio-Style-Transfer

Runtime error

nakas committed on Nov 14, 2022

Commit

1f1c84d

1 Parent(s): e66b829

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,7 +4,20 @@ from audio_style_transfer.models import timedomain
 def audioStyleTransfer(content,style):
     print (style,content)
     output = "/tmp/outputfile.wav"
-    timedomain.run( style_fname=style, content_fname=content ,output_fname=output)
     print ("output is " ,output)
     return  output

 def audioStyleTransfer(content,style):
     print (style,content)
     output = "/tmp/outputfile.wav"
+    sr = librosa.get_samplerate(content)
+    timedomain.run( style_fname=style,
+        content_fname=content,
+        output_fname=output,
+        norm=False,
+        n_fft=8192,          # 512 to sr / 2. Higher is better quality but is slower.
+        n_layers=2,          # 1 to 3. Higher is better quality but is slower.
+        n_filters=4096,      # 512 - 4096. Higher is better quality but is slower.
+        hop_length=256,      # 256 to n_fft / 2. The lower this value, the better the temporal resolution.
+        alpha=0.0005,        # 0.0001 to 0.01. The higher this value, the more of the original "content" bleeds
+        k_w=4,               # 3 to 5. The higher this value, the more complex the patterns it can synthesize.
+        iterations=300,      # 100 to 1000. Higher is better quality but is slower.
+        stride=1,            # 1 to 3. Lower is better quality but is slower.
+        sr=sr)
     print ("output is " ,output)
     return  output