File size: 710 Bytes
9206300
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# Path to another YAML configuration file.
# NOTE(review): presumably the keys in this file override values inherited
# from it — confirm how the config loader resolves `base_config`.
base_config: ./transformer_tts.yaml
# Arguments grouped under `pre_align_args`.
pre_align_args:
  # NOTE(review): presumably enables silence trimming — confirm with consumer.
  trim_sil: true
# Binarization flags: only `shuffle` and `with_txt` are enabled here; every
# other `with_*` flag (wav, align, spk_embed, f0, f0cwt) is disabled.
binarization_args:
  shuffle: true
  with_txt: true
  with_wav: false
  with_align: false
  with_spk_embed: false
  with_f0: false
  with_f0cwt: false
# NOTE(review): very large value; looks like an "effectively unlimited"
# placeholder rather than a real speaker count — confirm with the consumer.
num_spk: 9999999
# Dotted path of the binarizer class (an ASR binarizer).
binarizer_cls: data_gen.asr.asr_binarize.ASRBinarizer
# Three stride values, written as a short flow sequence.
strides: [2, 2, 1]
enc_ffn_kernel_size: 15
encoder_hidden_size: 256

# Model variant selector.
model_type: trans
# Settings for the LSTM decoder.
# NOTE(review): `model_type` above is `trans`, so these keys may be unused
# in this configuration — confirm before tuning or removing them.
decoder_hidden_size: 512
decoder_rnn_dim: 512
p_attention_dropout: 0.05
p_decoder_dropout: 0.05
attention_rnn_dim: 512
attention_dim: 256
attention_location_n_filters: 16
attention_location_kernel_size: 15

# Size limits and layer counts.
# NOTE(review): presumably `max_frames` caps input length, `max_tokens` is a
# batch size budget and `max_updates` bounds the number of training steps —
# confirm against the training code.
max_frames: 3000
# Encoder / decoder layer settings (8 encoder layers, 4 decoder layers).
enc_layers: 8
dec_layers: 4
dec_ffn_kernel_size: 1
max_tokens: 40000
max_updates: 400000