oza75 committed on
Commit
6812036
1 Parent(s): bfcd373

Upload new_model_config_01.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. new_model_config_01.json +325 -0
new_model_config_01.json ADDED
@@ -0,0 +1,325 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "output_path": "/workspace/coqui-TTS/finetuning/bambara/run/training",
3
+ "logger_uri": null,
4
+ "run_name": "xtts_lr_6e-06_mel_loss_1.5_epochs_40",
5
+ "project_name": "BAM_FINE_TUNING_3",
6
+ "run_description": "\n GPT XTTS training\n ",
7
+ "print_step": 100,
8
+ "plot_step": 100,
9
+ "model_param_stats": false,
10
+ "wandb_entity": null,
11
+ "dashboard_logger": "wandb",
12
+ "save_on_interrupt": true,
13
+ "log_model_step": 1194,
14
+ "save_step": 10000,
15
+ "save_n_checkpoints": 1,
16
+ "save_checkpoints": true,
17
+ "save_all_best": false,
18
+ "save_best_after": 0,
19
+ "target_loss": null,
20
+ "print_eval": false,
21
+ "test_delay_epochs": 0,
22
+ "run_eval": true,
23
+ "run_eval_steps": null,
24
+ "distributed_backend": "nccl",
25
+ "distributed_url": "tcp://127.0.0.1:54321",
26
+ "mixed_precision": false,
27
+ "precision": "fp16",
28
+ "epochs": 40,
29
+ "batch_size": 12,
30
+ "eval_batch_size": 12,
31
+ "grad_clip": 0.0,
32
+ "scheduler_after_epoch": true,
33
+ "lr": 6e-06,
34
+ "optimizer": "radam",
35
+ "optimizer_params": {
36
+ "betas": [
37
+ 0.9,
38
+ 0.96
39
+ ],
40
+ "eps": 1e-08,
41
+ "weight_decay": 0.01
42
+ },
43
+ "lr_scheduler": "ExponentialLR",
44
+ "lr_scheduler_params": {
45
+ "gamma": 0.989,
46
+ "last_epoch": -1
47
+ },
48
+ "use_grad_scaler": false,
49
+ "allow_tf32": true,
50
+ "cudnn_enable": true,
51
+ "cudnn_deterministic": false,
52
+ "cudnn_benchmark": false,
53
+ "training_seed": 1,
54
+ "model": "xtts",
55
+ "num_loader_workers": 8,
56
+ "num_eval_loader_workers": 0,
57
+ "use_noise_augment": false,
58
+ "audio": {
59
+ "sample_rate": 22050,
60
+ "output_sample_rate": 24000,
61
+ "dvae_sample_rate": 22050
62
+ },
63
+ "use_phonemes": false,
64
+ "phonemizer": null,
65
+ "phoneme_language": null,
66
+ "compute_input_seq_cache": false,
67
+ "text_cleaner": null,
68
+ "enable_eos_bos_chars": false,
69
+ "test_sentences_file": "",
70
+ "phoneme_cache_path": null,
71
+ "characters": null,
72
+ "add_blank": false,
73
+ "batch_group_size": 48,
74
+ "loss_masking": null,
75
+ "min_audio_len": 1,
76
+ "max_audio_len": Infinity,
77
+ "min_text_len": 1,
78
+ "max_text_len": Infinity,
79
+ "compute_f0": false,
80
+ "compute_energy": false,
81
+ "compute_linear_spec": false,
82
+ "precompute_num_workers": 0,
83
+ "start_by_longest": false,
84
+ "shuffle": false,
85
+ "drop_last": false,
86
+ "datasets": [
87
+ {
88
+ "formatter": "",
89
+ "dataset_name": "",
90
+ "path": "",
91
+ "meta_file_train": "",
92
+ "ignored_speakers": null,
93
+ "language": "",
94
+ "phonemizer": "",
95
+ "meta_file_val": "",
96
+ "meta_file_attn_mask": ""
97
+ }
98
+ ],
99
+ "test_sentences": [
100
+ {
101
+ "text": "Dumuni b\u025b taa farikolo fan jum\u025bn ?",
102
+ "speaker_wav": [
103
+ "./reference_audios/bm/speaker_10/0.wav",
104
+ "./reference_audios/bm/speaker_10/1.wav",
105
+ "./reference_audios/bm/speaker_10/3.wav",
106
+ "./reference_audios/bm/speaker_10/4.wav",
107
+ "./reference_audios/bm/speaker_10/5.wav",
108
+ "./reference_audios/bm/speaker_10/6.wav",
109
+ "./reference_audios/bm/speaker_10/7.wav",
110
+ "./reference_audios/bm/speaker_10/8.wav",
111
+ "./reference_audios/bm/speaker_10/9.wav"
112
+ ],
113
+ "language": "bm"
114
+ },
115
+ {
116
+ "text": "Ni sumaya furak\u025bli damin\u025bna, an ka kan ka to ka fura ta ka taa \u0272\u025b, walima ka to ka pikiri ni s\u0254r\u0254muw k\u025b ka taa \u0272\u025b fo sumaya ka ban pew.",
117
+ "speaker_wav": [
118
+ "./reference_audios/bm/speaker_14/0.wav",
119
+ "./reference_audios/bm/speaker_14/1.wav",
120
+ "./reference_audios/bm/speaker_14/2.wav",
121
+ "./reference_audios/bm/speaker_14/3.wav",
122
+ "./reference_audios/bm/speaker_14/4.wav",
123
+ "./reference_audios/bm/speaker_14/5.wav",
124
+ "./reference_audios/bm/speaker_14/6.wav",
125
+ "./reference_audios/bm/speaker_14/7.wav",
126
+ "./reference_audios/bm/speaker_14/8.wav"
127
+ ],
128
+ "language": "bm"
129
+ },
130
+ {
131
+ "text": "A ko k\u025bra degunba ye jamanadenw ma k\u025br\u025bnk\u025br\u025bnna demis\u025bn finitiniw ni m\u0254g\u0254 k\u0254r\u0254baw.",
132
+ "speaker_wav": [
133
+ "./reference_audios/bm/speaker_15/0.wav",
134
+ "./reference_audios/bm/speaker_15/1.wav",
135
+ "./reference_audios/bm/speaker_15/2.wav",
136
+ "./reference_audios/bm/speaker_15/3.wav",
137
+ "./reference_audios/bm/speaker_15/4.wav",
138
+ "./reference_audios/bm/speaker_15/6.wav",
139
+ "./reference_audios/bm/speaker_15/7.wav"
140
+ ],
141
+ "language": "bm"
142
+ },
143
+ {
144
+ "text": "Silam\u025b dannabaaw Burkina Faso la, u ye Eid El Fitr seli k\u025b seli la min k\u025bra sun kalo laban don na .",
145
+ "speaker_wav": [
146
+ "./reference_audios/bm/speaker_27/0.wav",
147
+ "./reference_audios/bm/speaker_27/1.wav",
148
+ "./reference_audios/bm/speaker_27/2.wav",
149
+ "./reference_audios/bm/speaker_27/3.wav",
150
+ "./reference_audios/bm/speaker_27/7.wav",
151
+ "./reference_audios/bm/speaker_27/8.wav",
152
+ "./reference_audios/bm/speaker_27/9.wav"
153
+ ],
154
+ "language": "bm"
155
+ },
156
+ {
157
+ "text": "le texte devra attendre l\u2019avis du Conseil constitutionnel avant son examen \u00e0 l\u2019Assembl\u00e9e.",
158
+ "speaker_wav": [
159
+ "./reference_audios/fr/speaker_100/0.wav",
160
+ "./reference_audios/fr/speaker_100/1.wav",
161
+ "./reference_audios/fr/speaker_100/2.wav",
162
+ "./reference_audios/fr/speaker_100/3.wav",
163
+ "./reference_audios/fr/speaker_100/4.wav",
164
+ "./reference_audios/fr/speaker_100/5.wav",
165
+ "./reference_audios/fr/speaker_100/6.wav",
166
+ "./reference_audios/fr/speaker_100/7.wav",
167
+ "./reference_audios/fr/speaker_100/8.wav",
168
+ "./reference_audios/fr/speaker_100/9.wav"
169
+ ],
170
+ "language": "fr"
171
+ },
172
+ {
173
+ "text": "Below are benchmarks for downsampling and upsampling waveforms between two pairs of sampling rates.",
174
+ "speaker_wav": [
175
+ "./reference_audios/en/speaker_98/0.wav",
176
+ "./reference_audios/en/speaker_98/1.wav",
177
+ "./reference_audios/en/speaker_98/2.wav",
178
+ "./reference_audios/en/speaker_98/3.wav",
179
+ "./reference_audios/en/speaker_98/4.wav",
180
+ "./reference_audios/en/speaker_98/5.wav",
181
+ "./reference_audios/en/speaker_98/6.wav",
182
+ "./reference_audios/en/speaker_98/7.wav",
183
+ "./reference_audios/en/speaker_98/8.wav",
184
+ "./reference_audios/en/speaker_98/9.wav"
185
+ ],
186
+ "language": "en"
187
+ },
188
+ {
189
+ "text": "La convivencia se asienta en Euskadi con la asignatura pendiente de la memoria",
190
+ "speaker_wav": [
191
+ "./reference_audios/es/speaker_47/0.wav",
192
+ "./reference_audios/es/speaker_47/1.wav",
193
+ "./reference_audios/es/speaker_47/2.wav",
194
+ "./reference_audios/es/speaker_47/3.wav",
195
+ "./reference_audios/es/speaker_47/4.wav",
196
+ "./reference_audios/es/speaker_47/5.wav",
197
+ "./reference_audios/es/speaker_47/6.wav",
198
+ "./reference_audios/es/speaker_47/7.wav",
199
+ "./reference_audios/es/speaker_47/8.wav",
200
+ "./reference_audios/es/speaker_47/9.wav"
201
+ ],
202
+ "language": "es"
203
+ },
204
+ {
205
+ "text": "Quei mariuoli di troppo alla corte dell\u2019ex sceriffo. Cos\u00ec il sistema Emiliano sta affondando la Puglia",
206
+ "speaker_wav": [
207
+ "./reference_audios/it/speaker_32/0.wav",
208
+ "./reference_audios/it/speaker_32/1.wav",
209
+ "./reference_audios/it/speaker_32/2.wav",
210
+ "./reference_audios/it/speaker_32/3.wav",
211
+ "./reference_audios/it/speaker_32/4.wav",
212
+ "./reference_audios/it/speaker_32/5.wav",
213
+ "./reference_audios/it/speaker_32/6.wav",
214
+ "./reference_audios/it/speaker_32/7.wav",
215
+ "./reference_audios/it/speaker_32/8.wav",
216
+ "./reference_audios/it/speaker_32/9.wav"
217
+ ],
218
+ "language": "it"
219
+ },
220
+ {
221
+ "text": "Les Insoumis ont obtenu ce mardi 9 avril que le texte soit retir\u00e9 de l\u2019ordre du jour de l\u2019Assembl\u00e9e nationale en attendant un avis du Conseil constitutionnel.",
222
+ "speaker_wav": [
223
+ "./reference_audios/fr/speaker_100/0.wav",
224
+ "./reference_audios/fr/speaker_100/1.wav",
225
+ "./reference_audios/fr/speaker_100/2.wav",
226
+ "./reference_audios/fr/speaker_100/3.wav",
227
+ "./reference_audios/fr/speaker_100/4.wav",
228
+ "./reference_audios/fr/speaker_100/5.wav",
229
+ "./reference_audios/fr/speaker_100/6.wav",
230
+ "./reference_audios/fr/speaker_100/7.wav",
231
+ "./reference_audios/fr/speaker_100/8.wav",
232
+ "./reference_audios/fr/speaker_100/9.wav"
233
+ ],
234
+ "language": "fr"
235
+ }
236
+ ],
237
+ "eval_split_max_size": 256,
238
+ "eval_split_size": 0.01,
239
+ "use_speaker_weighted_sampler": false,
240
+ "speaker_weighted_sampler_alpha": 1.0,
241
+ "use_language_weighted_sampler": false,
242
+ "language_weighted_sampler_alpha": 1.0,
243
+ "use_length_weighted_sampler": false,
244
+ "length_weighted_sampler_alpha": 1.0,
245
+ "model_args": {
246
+ "gpt_batch_size": 1,
247
+ "enable_redaction": false,
248
+ "kv_cache": true,
249
+ "gpt_checkpoint": "",
250
+ "clvp_checkpoint": null,
251
+ "decoder_checkpoint": null,
252
+ "num_chars": 255,
253
+ "tokenizer_file": "/workspace/coqui-TTS/finetuning/bambara/run/training/XTTS_v2.0_original_model_files/vocab.json",
254
+ "gpt_max_audio_tokens": 605,
255
+ "gpt_max_text_tokens": 402,
256
+ "gpt_max_prompt_tokens": 70,
257
+ "gpt_layers": 30,
258
+ "gpt_n_model_channels": 1024,
259
+ "gpt_n_heads": 16,
260
+ "gpt_number_text_tokens": 8130,
261
+ "gpt_start_text_token": 261,
262
+ "gpt_stop_text_token": 0,
263
+ "gpt_num_audio_tokens": 1026,
264
+ "gpt_start_audio_token": 1024,
265
+ "gpt_stop_audio_token": 1025,
266
+ "gpt_code_stride_len": 1024,
267
+ "gpt_use_masking_gt_prompt_approach": true,
268
+ "gpt_use_perceiver_resampler": true,
269
+ "input_sample_rate": 22050,
270
+ "output_sample_rate": 24000,
271
+ "output_hop_length": 256,
272
+ "decoder_input_dim": 1024,
273
+ "d_vector_dim": 512,
274
+ "cond_d_vector_in_each_upsampling_layer": true,
275
+ "duration_const": 102400,
276
+ "min_conditioning_length": 66150,
277
+ "max_conditioning_length": 132300,
278
+ "gpt_loss_text_ce_weight": 0.01,
279
+ "gpt_loss_mel_ce_weight": 1.5,
280
+ "debug_loading_failures": false,
281
+ "max_wav_length": 255995,
282
+ "max_text_length": 200,
283
+ "mel_norm_file": "/workspace/coqui-TTS/finetuning/bambara/run/training/XTTS_v2.0_original_model_files/mel_stats.pth",
284
+ "dvae_checkpoint": "/workspace/coqui-TTS/finetuning/bambara/run/training/XTTS_v2.0_original_model_files/dvae.pth",
285
+ "xtts_checkpoint": "/workspace/coqui-TTS/finetuning/bambara/run/training/xtts_lr_6e-06_mel_loss_1.5_epochs_40-May-08-2024_03+32AM-db6e7cd3/best_model_10737.pth",
286
+ "vocoder": ""
287
+ },
288
+ "model_dir": null,
289
+ "languages": [
290
+ "en",
291
+ "es",
292
+ "fr",
293
+ "de",
294
+ "it",
295
+ "pt",
296
+ "pl",
297
+ "tr",
298
+ "ru",
299
+ "nl",
300
+ "cs",
301
+ "ar",
302
+ "zh-cn",
303
+ "hu",
304
+ "ko",
305
+ "ja",
306
+ "hi",
307
+ "bm"
308
+ ],
309
+ "temperature": 0.85,
310
+ "length_penalty": 1.0,
311
+ "repetition_penalty": 2.0,
312
+ "top_k": 50,
313
+ "top_p": 0.85,
314
+ "num_gpt_outputs": 1,
315
+ "gpt_cond_len": 12,
316
+ "gpt_cond_chunk_len": 4,
317
+ "max_ref_len": 10,
318
+ "sound_norm_refs": true,
319
+ "optimizer_wd_only_on_weights": false,
320
+ "weighted_loss_attrs": {},
321
+ "weighted_loss_multipliers": {},
322
+ "transliterate_bambara": false,
323
+ "warmup_steps": null,
324
+ "warmup_start_lr": 0.1
325
+ }