andre-coy committed on
Commit
96203aa
•
1 Parent(s): 107903d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -14
app.py CHANGED
@@ -14,10 +14,10 @@ vocoder = SpeechT5HifiGan.from_pretrained("microsoft/speecht5_hifigan")
14
 
15
  speaker_embeddings = {
16
  "BDL": "spkemb/triniFemale.npy",
17
- #"CLB": "spkemb/triniFemale.npy",
18
- #"KSP": "spkemb/triniFemale.npy",
19
- #"RMS": "spkemb/triniFemale.npy",
20
- #"SLT": "spkemb/triniFemale.npy",
21
  }
22
 
23
 
@@ -59,16 +59,16 @@ def predict(text, speaker):
59
 
60
  title = "SpeechT5: Speech Synthesis"
61
 
62
- description = """
63
- The <b>SpeechT5</b> model is pre-trained on text as well as speech inputs, with targets that are also a mix of text and speech.
64
- By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
65
 
66
- SpeechT5 can be fine-tuned for different speech tasks. This space demonstrates the <b>text-to-speech</b> (TTS) checkpoint for the English language.
67
 
68
- See also the <a href="https://huggingface.co/spaces/Matthijs/speecht5-asr-demo">speech recognition (ASR) demo</a>
69
- and the <a href="https://huggingface.co/spaces/Matthijs/speecht5-vc-demo">voice conversion demo</a>.
70
 
71
- Refer to <a href="https://colab.research.google.com/drive/1i7I5pzBcU3WDFarDnzweIj4-sVVoIUFJ">this Colab notebook</a> to learn how to fine-tune the SpeechT5 TTS model on your own dataset or language.
72
 
73
  <b>How to use:</b> Enter some English text and choose a speaker. The output is a mel spectrogram, which is converted to a mono 16 kHz waveform by the
74
  HiFi-GAN vocoder. Because the model always applies random dropout, each attempt will give slightly different results.
@@ -91,14 +91,14 @@ article = """
91
  primaryClass={eess.AS},
92
  year={2021}
93
  }
94
- </pre>
95
 
96
- <p>Speaker embeddings were generated from <a href="http://www.festvox.org/cmu_arctic/">CMU ARCTIC</a> using <a href="https://huggingface.co/mechanicalsea/speecht5-vc/blob/main/manifest/utils/prep_cmu_arctic_spkemb.py">this script</a>.</p>
97
 
98
  </div>
99
  """
100
 
101
- #examples = [ \
102
  #["It is not in the stars to hold our destiny but in ourselves.", "BDL (male)"],
103
  #["The octopus and Oliver went to the opera in October.", "CLB (female)"],
104
  #["She sells seashells by the seashore. I saw a kitten eating chicken in the kitchen.", "RMS (male)"],
 
14
 
15
  speaker_embeddings = {
16
  "BDL": "spkemb/triniFemale.npy",
17
+ "CLB": "spkemb/triniFemale.npy",
18
+ "KSP": "spkemb/triniFemale.npy",
19
+ "RMS": "spkemb/triniFemale.npy",
20
+ "SLT": "spkemb/triniFemale.npy",
21
  }
22
 
23
 
 
59
 
60
  title = "SpeechT5: Speech Synthesis"
61
 
62
+ #description = "
63
+ #The <b>SpeechT5</b> model is pre-trained on text as well as speech inputs, with targets that are also a mix of text and speech.
64
+ #By pre-training on text and speech at the same time, it learns unified representations for both, resulting in improved modeling capabilities.
65
 
66
+ #SpeechT5 can be fine-tuned for different speech tasks. This space demonstrates the <b>text-to-speech</b> (TTS) checkpoint for the English language.
67
 
68
+ #See also the <a href="https://huggingface.co/spaces/Matthijs/speecht5-asr-demo">speech recognition (ASR) demo</a>
69
+ #and the <a href="https://huggingface.co/spaces/Matthijs/speecht5-vc-demo">voice conversion demo</a>.
70
 
71
+ #Refer to <a href="https://colab.research.google.com/drive/1i7I5pzBcU3WDFarDnzweIj4-sVVoIUFJ">this Colab notebook</a> to learn how to fine-tune the SpeechT5 TTS model on your own dataset or language.
72
 
73
  <b>How to use:</b> Enter some English text and choose a speaker. The output is a mel spectrogram, which is converted to a mono 16 kHz waveform by the
74
  HiFi-GAN vocoder. Because the model always applies random dropout, each attempt will give slightly different results.
 
91
  primaryClass={eess.AS},
92
  year={2021}
93
  }
94
+ #</pre>
95
 
96
+ #<p>Speaker embeddings were generated from <a href="http://www.festvox.org/cmu_arctic/">CMU ARCTIC</a> using <a href="https://huggingface.co/mechanicalsea/speecht5-vc/blob/main/manifest/utils/prep_cmu_arctic_spkemb.py">this script</a>.</p>
97
 
98
  </div>
99
  """
100
 
101
+ #examples = [
102
  #["It is not in the stars to hold our destiny but in ourselves.", "BDL (male)"],
103
  #["The octopus and Oliver went to the opera in October.", "CLB (female)"],
104
  #["She sells seashells by the seashore. I saw a kitten eating chicken in the kitchen.", "RMS (male)"],