kevinwang676
committed on
Commit
·
16ddf32
1
Parent(s):
c09fd29
Update app.py
Browse files
app.py
CHANGED
@@ -22,14 +22,6 @@ import numpy as np
|
|
22 |
# from IPython.display import Audio
|
23 |
|
24 |
import torch
|
25 |
-
import torchaudio
|
26 |
-
from speechbrain.pretrained import SpectralMaskEnhancement
|
27 |
-
|
28 |
-
enhance_model = SpectralMaskEnhancement.from_hparams(
|
29 |
-
source="speechbrain/metricgan-plus-voicebank",
|
30 |
-
savedir="pretrained_models/metricgan-plus-voicebank",
|
31 |
-
run_opts={"device":"cuda"},
|
32 |
-
)
|
33 |
|
34 |
from TTS.tts.utils.synthesis import synthesis
|
35 |
from TTS.tts.utils.text.symbols import make_symbols, phonemes, symbols
|
@@ -171,15 +163,7 @@ def voice_conversion(ta, ra, da):
|
|
171 |
# print("Reference Audio after decoder:")
|
172 |
# IPython.display.display(Audio(ref_wav_voc, rate=ap.sample_rate))
|
173 |
|
174 |
-
|
175 |
-
ref_wav_voc
|
176 |
-
).unsqueeze(0)
|
177 |
-
|
178 |
-
enhanced = enhance_model.enhance_batch(noisy, lengths=torch.tensor([1.]))
|
179 |
-
torchaudio.save("enhanced.wav", enhanced.cpu(), 16000)
|
180 |
-
|
181 |
-
return "enhanced.wav"
|
182 |
-
|
183 |
|
184 |
def generate_text_to_speech(text_prompt, selected_speaker, text_temp, waveform_temp):
|
185 |
audio_array = generate_audio(text_prompt, selected_speaker, text_temp, waveform_temp)
|
@@ -262,7 +246,7 @@ with gr.Blocks() as demo:
|
|
262 |
)
|
263 |
gr.Markdown(
|
264 |
"""
|
265 |
-
|
266 |
## 🌎 Foreign Language
|
267 |
Bark supports various languages out-of-the-box and automatically determines language from input text. \
|
268 |
When prompted with code-switched text, Bark will even attempt to employ the native accent for the respective languages in the same voice.
|
|
|
22 |
# from IPython.display import Audio
|
23 |
|
24 |
import torch
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
|
26 |
from TTS.tts.utils.synthesis import synthesis
|
27 |
from TTS.tts.utils.text.symbols import make_symbols, phonemes, symbols
|
|
|
163 |
# print("Reference Audio after decoder:")
|
164 |
# IPython.display.display(Audio(ref_wav_voc, rate=ap.sample_rate))
|
165 |
|
166 |
+
return (ap.sample_rate, ref_wav_voc)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
167 |
|
168 |
def generate_text_to_speech(text_prompt, selected_speaker, text_temp, waveform_temp):
|
169 |
audio_array = generate_audio(text_prompt, selected_speaker, text_temp, waveform_temp)
|
|
|
246 |
)
|
247 |
gr.Markdown(
|
248 |
"""
|
249 |
+
## π - You may also apply [VoiceFixer](https://huggingface.co/spaces/Kevin676/VoiceFixer) to the generated audio in order to enhance the speech.
|
250 |
## 🌎 Foreign Language
|
251 |
Bark supports various languages out-of-the-box and automatically determines language from input text. \
|
252 |
When prompted with code-switched text, Bark will even attempt to employ the native accent for the respective languages in the same voice.
|