Text-to-Speech
Fairseq
English
audio
multi-speaker
File size: 636 Bytes
473c5e0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Acoustic feature-extraction settings.
# NOTE(review): the meanings below are inferred from the key names and from
# the arithmetic relations between the values; confirm against the consumer.
features:
  # Upper/lower bounds for the energy feature. The negative minimum suggests
  # the values are normalized rather than raw — TODO confirm.
  energy_max: 5.646703243255615
  energy_min: -3.548804759979248
  # Small constant; presumably a floor applied before the log step named in
  # `type` — verify.
  eps: 1.0e-05
  # Presumably the mel filterbank frequency range in Hz. f_max is below
  # sample_rate / 2 (11025) — confirm this cap is intentional.
  f_max: 8000
  f_min: 0
  # Equals hop_length / sample_rate (256 / 22050); presumably the hop
  # expressed in seconds. Keep in sync with hop_length and sample_rate.
  hop_len_t: 0.011609977324263039
  hop_length: 256
  n_fft: 1024
  n_mels: 80
  # Equals n_fft / 2 + 1 (1024 / 2 + 1). Keep in sync with n_fft.
  n_stft: 513
  # Upper/lower bounds for the pitch feature. The negative minimum suggests
  # the values are normalized rather than raw — TODO confirm.
  pitch_max: 5.164862652912731
  pitch_min: -2.5049682966705484
  sample_rate: 22050
  # '+'-joined stage names; presumably applied in the order written — verify.
  type: spectrogram+melscale+log
  # Equals win_length / sample_rate (1024 / 22050); presumably the window
  # expressed in seconds. Keep in sync with win_length and sample_rate.
  win_len_t: 0.046439909297052155
  win_length: 1024
  window_fn: hann
# Location of the statistics file used by the `global_cmvn` step.
# NOTE(review): the path is a bare file name; presumably it is resolved
# relative to this config's directory — confirm with the loader.
global_cmvn:
  stats_npz_path: gcmvn_stats.npz
# Feature transforms, keyed by a selector that maps to a list of transform
# names.
# The '*' key must stay quoted: an unquoted * is YAML's alias indicator.
# NOTE(review): '*' presumably acts as a wildcard matching every data split —
# confirm against the consumer.
transforms:
  '*':
  - global_cmvn
# File names of the vocabulary and of the speaker set.
# NOTE(review): both are bare file names; presumably resolved relative to this
# config's directory — confirm with the loader.
vocab_filename: vocab.txt
speaker_set_filename: speakers.txt
# Vocoder selection: the vocoder type plus the file names of its config and
# checkpoint.
# NOTE(review): presumably used to turn the predicted spectrogram features
# into a waveform; file names are presumably resolved relative to this
# config's directory — confirm with the loader.
vocoder:
  type: hifigan
  config: hifigan.json
  checkpoint: hifigan.bin
# Settings read by the hub-side inference interface.
# NOTE(review): `g2p` presumably names the grapheme-to-phoneme front end that
# converts input text before synthesis — confirm which implementation the
# consumer maps this value to.
hub:
  phonemizer: g2p