diff --git a/full_models/abi/D_100000.pth b/full_models/abi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d9ba161fd06d5feb0cd27d3ccfe1f4b6b7cd23c --- /dev/null +++ b/full_models/abi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be668a16e5b9b9dedd41e08442644f4ed894e4c62f43d06e7e448158428e2fe +size 561098185 diff --git a/full_models/abi/G_100000.pth b/full_models/abi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3da2d1b1bad153179fcbf0d6e99b6b62a8d23326 --- /dev/null +++ b/full_models/abi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bee8bd93805bd44cee1ff5497bc3a87220eeeec8b0fd6a2368d0609001a2868 +size 436570305 diff --git a/full_models/abi/config.json b/full_models/abi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/abi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/abi/vocab.txt b/full_models/abi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4a994d1d83ffb58a9050ed3b2944571dacdeb19d --- /dev/null +++ b/full_models/abi/vocab.txt @@ -0,0 +1,53 @@ +ɔ +ê +ǒ + +̂ +h +ě +i +ɩ +k +á +̌ +ǐ +b +p +í +ǔ +u +ń +w +' +ί +f +ó +y +s +î +m +ɛ +έ +e +ʋ +ḿ +n +ú +o +d +â +ô +c +ǎ +é +́ +j +l +- +t +_ +r +g +ε +û +a diff --git a/full_models/abp/D_100000.pth b/full_models/abp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be4880b6687ff9f2984ee43c1b678e802079e6ac --- /dev/null +++ b/full_models/abp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3176637b067b5fc78605aff0b553ec09244da37ebbff3f419163cede7824c441 +size 561098185 diff --git a/full_models/abp/G_100000.pth b/full_models/abp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..69e8e15728c4e63ef9fda591cdf5c6fb8e041a97 --- /dev/null +++ b/full_models/abp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f621739a139733b14ac70f032ab4a677e8912fa3a1132ba3f8cf599dee6dbbac +size 436524225 diff --git a/full_models/abp/config.json b/full_models/abp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/abp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/abp/vocab.txt b/full_models/abp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6212eeac9b50a1f9c557d0c58b81f310fb37105c --- /dev/null +++ b/full_models/abp/vocab.txt @@ -0,0 +1,33 @@ +_ +t +e +b +ō +j +c +r +f +w +i +q +h +g +l +m +k +y +d +ā +s +' +a +n +x +6 +o +- +p +u + +v +z diff --git a/full_models/aca/D_100000.pth b/full_models/aca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..34709ae421999948d7bae197eb67717623718303 --- /dev/null +++ b/full_models/aca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae308c0880cb4e3bd2d02600485b473f068c38ff85bac0a7d5bd8951ba1ce963 +size 561076199 diff --git a/full_models/aca/G_100000.pth b/full_models/aca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..650482ef6329f56c71acb5d7dfc22a013737fd43 --- /dev/null +++ b/full_models/aca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78666df5cbdca3fbd91b2bb2f49841f8919b7a73ab6e504ed82f7597e41c190f +size 436353726 diff --git a/full_models/aca/config.json b/full_models/aca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aca/vocab.txt b/full_models/aca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4084ed70136d3cc1b19011be47c72f83cf27cbc7 --- /dev/null +++ b/full_models/aca/vocab.txt @@ -0,0 +1,35 @@ +a +| +i +n +á +c +e +u +l +r +w +j +s +í +m +é +o +' +h +t +y +b +d +ú +q +ó +p +— +g +f +z +v +x +ñ + diff --git a/full_models/acd/D_100000.pth b/full_models/acd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f428b2fd06947ba1d480d6529fb4f676908e3a56 --- /dev/null +++ b/full_models/acd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c06f2853c68b0bc604a40caa9261cf439f0b02d66a510b08a0660b0f8e3201 +size 561078480 diff --git a/full_models/acd/G_100000.pth b/full_models/acd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ec84b4f9ddd9238fd4db4b14d41ecfd5956b97c --- /dev/null +++ b/full_models/acd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2d3e15a2db968008b7b01eb6282b9c24115221f2abccd8935ee11a16d6f6cf9 +size 436355114 diff --git a/full_models/acd/config.json b/full_models/acd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/acd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/acd/vocab.txt b/full_models/acd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5c7d657c6db735544c06fd99177080daddff11e3 --- /dev/null +++ b/full_models/acd/vocab.txt @@ -0,0 +1,28 @@ +| +a +ɛ +n +ɔ +i +o +m +y +e +u +g +s +k +b +r +l +d +w +f +- +t +p +' +ŋ +h +c + diff --git a/full_models/ace/D_100000.pth b/full_models/ace/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b72ffb7a43dad532db36ee14b4cc8c804e05e58e --- /dev/null +++ b/full_models/ace/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecacad3f1f738085d053f35c5618c4abceaee39c28dbff2975e17fc918cea5c7 +size 561078594 diff --git a/full_models/ace/G_100000.pth b/full_models/ace/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c55c16e663d8c497f5a61406a2cd7f0c427dba86 --- /dev/null +++ b/full_models/ace/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183895b264e9f91617ababbd088b5309ea79468730819506c8c8ab5e977085e6 +size 436387528 diff --git a/full_models/ace/config.json b/full_models/ace/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ace/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ace/vocab.txt b/full_models/ace/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5370d0f0f0f212614f1bec2acd6aa7d39b4d6112 --- /dev/null +++ b/full_models/ace/vocab.txt @@ -0,0 +1,42 @@ +| +a +n +e +u +g +t +h +i +k +m +b +o +y +l +r +s +p +j +d +é +w +ô +ë +- +c +ö +á +ó +f +z +' +q +ú +` +0 +6 +4 +3 +1 +2 + diff --git a/full_models/acf/D_100000.pth b/full_models/acf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4cd4ecd7ab7203c43efb248b582d7a65b0f68df9 --- /dev/null +++ b/full_models/acf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:262ec2da7c0e7ded6eaa1cd84e37fe55127f23280d272d9453591df621511b21 +size 561078869 diff --git a/full_models/acf/G_100000.pth b/full_models/acf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a207157fbcf16ea52dc90a2e0cd26a0afa1cacb --- /dev/null +++ b/full_models/acf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f23d7c73bfdf05bec98d6fc71dffbf19409a9afb463b6974abccdaee53c215 +size 436369451 diff --git a/full_models/acf/config.json b/full_models/acf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/acf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/acf/vocab.txt b/full_models/acf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbd6591007a7d7d32b96903e4d1e2e7071d4a770 --- /dev/null +++ b/full_models/acf/vocab.txt @@ -0,0 +1,33 @@ +| +a +n +é +i +o +s +t +k +y +p +l +w +m +è +u +d +- +e +b +v +j +ò +z +f +ʼ +h +g +c +r +— +' + diff --git a/full_models/ach/D_100000.pth b/full_models/ach/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..27017db5a6a95dd26dfff4474dd67367e03062c3 --- /dev/null +++ b/full_models/ach/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d772464b61e01ae7415ad3b4cae63851b5fd89c15b6157b311446e3f3ea7460c +size 561078618 diff --git a/full_models/ach/G_100000.pth b/full_models/ach/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5773576754c98de8b157f7ae16fd8a7d8d367c9c --- /dev/null +++ b/full_models/ach/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46031da7d624512421e115dcfadede182580c6c3139d2ea2b7c20b4fabee7e1d +size 436355251 diff --git a/full_models/ach/config.json b/full_models/ach/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ach/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ach/vocab.txt b/full_models/ach/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..14f296445302e01b5d6d683ee1206b8c0d7054a9 --- /dev/null +++ b/full_models/ach/vocab.txt @@ -0,0 +1,28 @@ +| +o +a +i +e +k +n +m +w +t +u +y +l +c +d +b +g +r +p +ŋ +j +- +s +' +v +f +h + diff --git a/full_models/acn/D_100000.pth b/full_models/acn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67db02a732ce52f1c5a978ab838c253a9e24fe77 --- /dev/null +++ b/full_models/acn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7c7622cba3d3aa313a67157d78898fcffb20dc0855d9c9ac93e544a79b11f3 +size 561098185 diff --git a/full_models/acn/G_100000.pth b/full_models/acn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..807d11b27f7a85b63e3337dc5c5bfed5ca56c08c --- /dev/null +++ b/full_models/acn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f608e1298f921bba8ebfa9e1eadb3c599aff4a0eb64614fb32a3d372340a9b4b +size 436533441 diff --git a/full_models/acn/config.json b/full_models/acn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/acn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/acn/vocab.txt b/full_models/acn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..249bc5cef2d99e3605690cb42aa8aae3254d9940 --- /dev/null +++ b/full_models/acn/vocab.txt @@ -0,0 +1,37 @@ +u +k +g +a +_ +— +d +w +i +o +- +b +e +n +t +y +p +s +z +x +m +h +c + +l +0 +2 +j +f +3 +5 +q +v +r +6 +1 +4 diff --git a/full_models/acr/D_100000.pth b/full_models/acr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ac432042a447204f26ea116db59eab39fc8d012f --- /dev/null +++ b/full_models/acr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e790e6b73ad3a311ec0bd311e50a33846f38b8e63f074650687a6f588ea7df +size 561078709 diff --git a/full_models/acr/G_100000.pth b/full_models/acr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02d432c3f962a71e50a72a34f020c4f048a98508 --- /dev/null +++ b/full_models/acr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892faf58e703daf31d96bd7b9913d2b0eda8f750305282ba760a656280a5437f +size 436375881 diff --git a/full_models/acr/config.json b/full_models/acr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/acr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/acr/vocab.txt b/full_models/acr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77e4d297fd3ec3aba11fb74c4ecb53620ae68fed --- /dev/null +++ b/full_models/acr/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +' +k +r +u +e +j +n +o +c +l +h +t +q +w +x +m +b +s +y +p +z +d +— +ú +g +á +é +ó +f +í +v +- +ñ + diff --git a/full_models/acu/D_100000.pth b/full_models/acu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e46bf90ddc46363eec3020c6694fa6c700417942 --- /dev/null +++ b/full_models/acu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e8f2db7fee9018cff7d22ff7ede80bfcfb408c2cb3a38a3ccf32f1594865969 +size 561078587 diff --git a/full_models/acu/G_100000.pth b/full_models/acu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23c95902e37560b390d4a3a9d5ae4dd0dd614f2c --- /dev/null +++ b/full_models/acu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5952ecca5322b2410a5056b1852650d2fb9289f3cebce5e9b95a7ee76eabc621 +size 436371382 diff --git a/full_models/acu/config.json b/full_models/acu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/acu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/acu/vocab.txt b/full_models/acu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8a5265c61e4973a3fe8660e120f05420e52f25e7 --- /dev/null +++ b/full_models/acu/vocab.txt @@ -0,0 +1,35 @@ +a +| +i +n +u +t +r +m +k +s +e +h +j +c +w +y +p +g +o +í +— +ú +d +l +é +á +b +f +v +ó +z +q +x +ñ + diff --git a/full_models/ade/D_100000.pth b/full_models/ade/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..250e4498beefdeae3f133692fde4753c0902e21b --- /dev/null +++ b/full_models/ade/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41191e5d74955fec278ea692b2218c7920de8f16147aba556fdfce56b714f4c0 +size 561078757 diff --git a/full_models/ade/G_100000.pth b/full_models/ade/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..30ac31438323ad33c762825076456908f0fbeb8e --- /dev/null +++ b/full_models/ade/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed6df678ce5a605da1adef5aa7016ec89dd3b209ffebad3156843473d688668 +size 436384590 diff --git a/full_models/ade/config.json b/full_models/ade/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ade/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ade/vocab.txt b/full_models/ade/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c2dd6bded46e62603c493f1763ffd87e64925848 --- /dev/null +++ b/full_models/ade/vocab.txt @@ -0,0 +1,40 @@ +| +a +â +n +e +b +g +æ +i +t +w +ô +y +k +o +r +l +u +d +m +f +s +û +p +à +- +è +ã +õ +ù +î +å +ì +ü +ǹ +ò +h +' +c + diff --git a/full_models/adh/D_100000.pth b/full_models/adh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d79025eff8df2a4af64ee5fa584fc64640fe7638 --- /dev/null +++ b/full_models/adh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f466d6d8e81596e107e5e3ebb2f5fea640411555a9ae7a6b719bc80f0d11f42 +size 561078757 diff --git a/full_models/adh/G_100000.pth b/full_models/adh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8cac735bf6470dbcc96f5ec54c30336889f335c0 --- /dev/null +++ b/full_models/adh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6a6d6796cd6997ca30c352c12f25d36db4d80ac374e42318aeba8a2ce1905a +size 436360329 diff --git a/full_models/adh/config.json b/full_models/adh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/adh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/adh/vocab.txt b/full_models/adh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e09bdb8ae2b23055bbbc6091c3c079d3de54006c --- /dev/null +++ b/full_models/adh/vocab.txt @@ -0,0 +1,29 @@ +| +o +i +a +e +n +k +m +w +r +y +h +t +d +j +g +u +l +p +c +b +ŋ +s +f +' +z +v +- + diff --git a/full_models/adj/D_100000.pth b/full_models/adj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87940569b25ce7a093b9a4e1128455bf3391c276 --- /dev/null +++ b/full_models/adj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77757247ee18a706cb7cf12cf3c01269b4d96d9db1810496d5cecde1e4b37c5e +size 561078768 diff --git a/full_models/adj/G_100000.pth b/full_models/adj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e838d5932936299173bca68cb563f653324545c5 --- /dev/null +++ b/full_models/adj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2841867f1f11ff7ef9a742e17c9847b747fbad5b2e027b43bf2268f1570e04d5 +size 436399987 diff --git a/full_models/adj/config.json b/full_models/adj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/adj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/adj/vocab.txt b/full_models/adj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..734675457589febdbbf74363fa21218a2c9367b6 --- /dev/null +++ b/full_models/adj/vocab.txt @@ -0,0 +1,46 @@ +| +a +e +ɛ +n +m +l +k +i +ŋ +' +s +b +o +y +w +ɔ +u +r +g +c +t +d +j +f +p +- +ó +́ +í +̀ +á +h +é +ì +ò +ú +à +ê +v +ù +̂ +è +z +ô + diff --git a/full_models/adx/D_100000.pth b/full_models/adx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1c08fec5ef88d4e2609d2987c8396d61ff444360 --- /dev/null +++ b/full_models/adx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7960f71cdada5c2b176fd325db6561e010038a5ba369b8cfb5d182935ad0970f +size 561098185 diff --git a/full_models/adx/G_100000.pth b/full_models/adx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c65e57cf7a28632fee777602873421ad5763ae7 --- /dev/null +++ b/full_models/adx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb710ce2a77955594e5c822914d1a879a51d642356a6338e8e17fa6b9735498 +size 436584129 diff --git a/full_models/adx/config.json b/full_models/adx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/adx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/adx/vocab.txt b/full_models/adx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7aabb89c5b12f45477e7bdc34fe8cfe15e9a82b9 --- /dev/null +++ b/full_models/adx/vocab.txt @@ -0,0 +1,59 @@ +ཤ +ྐ +ི +འ +ཞ + +ྩ +པ +ྫ +ྱ +ྭ +ཙ +ད +ཁ +ྔ +ྷ +ུ +ེ +ོ +_ +ྡ +ཆ +མ +ྟ +ྤ +ན +ཉ +ཛ +ཊ +ཏ +ྦ +ྨ +ང +ཪ +ཟ +ས +ཚ +ྣ +ླ +ཇ +ྗ +ཨ +ྙ +ྒ +བ +ཅ +ཧ +ྲ +ཝ +ཡ +ཱ +ག +ཀ +ར +ཐ +ཕ +ྕ +ལ +་ diff --git a/full_models/aeu/D_100000.pth b/full_models/aeu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91f741e44b0f5d842eede2610f8a8fd383d5861d --- /dev/null +++ b/full_models/aeu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ef66fa37d86afbecd23619f940c3c4ba3ea5f053ee90bdc109dcdb81a3d580 +size 561098185 diff --git a/full_models/aeu/G_100000.pth b/full_models/aeu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..94795f03da12560d81dd81740b8fadf4aad70577 --- /dev/null +++ b/full_models/aeu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9319d4e75b7c46d3d16ac5ce566588b5b6f47fd96fcbada2d07b57d5f8f2e6a +size 436505793 diff --git a/full_models/aeu/config.json b/full_models/aeu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aeu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aeu/vocab.txt b/full_models/aeu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c54a7f4738f10defc9b2bfa2d2d5361d2f1181ea --- /dev/null +++ b/full_models/aeu/vocab.txt @@ -0,0 +1,25 @@ +b +j +g +t +u +- +k +q +s +i +e +l +o +p +_ +y +n +c +v + +m +h +d +a +w diff --git a/full_models/agd/D_100000.pth b/full_models/agd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..971a88a06ed34f1b3582eb44b9e3cd0222b15169 --- /dev/null +++ b/full_models/agd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04904daf1217f960beeb3bd26bb4e958380c5e1ebf85f4934c661a9b66daf617 +size 561098185 diff --git a/full_models/agd/G_100000.pth b/full_models/agd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1911f285b4ae2815016a97983f361027d9a5ee12 --- /dev/null +++ b/full_models/agd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b777c97ed4d4a860802ca68c48c48c413abc6add43eb620f2fcbe11c3b55b464 +size 436517313 diff --git a/full_models/agd/config.json b/full_models/agd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agd/vocab.txt b/full_models/agd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b96e7aae09da8a03795308a1cd2188e117e7981 --- /dev/null +++ b/full_models/agd/vocab.txt @@ -0,0 +1,30 @@ +3 +p +y +f +ó +4 +0 +á +m +- +r +h + +t +d +o +é +' +s +b +e +n +u +_ +v +ú +í +a +i +k diff --git a/full_models/agg/D_100000.pth b/full_models/agg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ae7d463d75891a73b4bf98f7af2963342f80e4e4 --- /dev/null +++ b/full_models/agg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6be729fc918766135efd129c642966bdc1d935d8247b18c58977b7c19be47fd1 +size 561076019 diff --git a/full_models/agg/G_100000.pth b/full_models/agg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..24c67ba9a33cfcd3c4734718cbcf11573e508dd0 --- /dev/null +++ b/full_models/agg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236cc80eced13e28464f10b554321a26eb582ebf2b1aebf41a0759fbb67c1743 +size 436347563 diff --git a/full_models/agg/config.json b/full_models/agg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agg/vocab.txt b/full_models/agg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..facf0a9e4869c6abd24fbab16bde1637e8dd0432 --- /dev/null +++ b/full_models/agg/vocab.txt @@ -0,0 +1,33 @@ +a +| +ɨ +o +n +m +h +r +u +d +i +b +e +s +ü +y +f +g +ŋ +k +w +p +t +- +0 +1 +7 +2 +4 +5 +6 +3 + diff --git a/full_models/agn/D_100000.pth b/full_models/agn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5dabe9f5c12ae3daea8575c292fdb75a4997e4e --- /dev/null +++ b/full_models/agn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ad91b0eb20455789a1a0dbc3b0918acf325934af65b400d48e5a79a5f1a446 +size 561078506 diff --git a/full_models/agn/G_100000.pth b/full_models/agn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b3528aca5062347b5af346889604842419ed8dcc --- /dev/null +++ b/full_models/agn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d17fcceded3f482f6130c5b36a88ad6e1753781cf0a18ed9092fd5c639f2bc +size 436382640 diff --git a/full_models/agn/config.json b/full_models/agn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agn/vocab.txt b/full_models/agn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..29c88df40b9a8c0a3aba63215a6a5777f1832f77 --- /dev/null +++ b/full_models/agn/vocab.txt @@ -0,0 +1,40 @@ +a +| +n +g +i +o +t +m +d +s +l +e +p +r +k +b +y +w +- +u +j +c +h +f +z +v +q +' +ā +ō +0 +x +1 +— +6 +ē +5 +2 +7 + diff --git a/full_models/agr/D_100000.pth b/full_models/agr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c990287b0370a236d7c912c46d284ba60d57ca50 --- /dev/null +++ b/full_models/agr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bedc0a3cfbaac3726afb632a2931831aba9cb79b78914b22d946ef59cf74b86 +size 561078705 diff --git a/full_models/agr/G_100000.pth b/full_models/agr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ced6da2df9e01b96a68543cf7770db286befeee7 --- /dev/null +++ b/full_models/agr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a4438c21efc7de9db4dca5f83c5b532bec1d031322c53902c0f13d4f352ab0 +size 436379514 diff --git a/full_models/agr/config.json b/full_models/agr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agr/vocab.txt b/full_models/agr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..753b549be4b59b79f33227dc7439772b7584fa70 --- /dev/null +++ b/full_models/agr/vocab.txt @@ -0,0 +1,38 @@ +a +| +i +u +n +t +k +m +j +s +e +g +h +w +d +p +c +y +í +b +r +o +á +ú +l +— +é +f +' +v +z +ó +q +x +ñ +2 +7 + diff --git a/full_models/agu/D_100000.pth b/full_models/agu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2cc445f99e869978f93174bb950a2c38c294945f --- /dev/null +++ b/full_models/agu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0b37c8104f711173ead1819a216a234c46b8bae96881469f41f3d74ba96814 +size 561098185 diff --git a/full_models/agu/G_100000.pth b/full_models/agu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..55c105edaed976ada2a3ce53cc789f85a5f6be81 --- /dev/null +++ b/full_models/agu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b435c0cad3a4bcedc1b6be5ed3b1bbb948f33ddf21de630a0a28e1270197baa +size 436540353 diff --git a/full_models/agu/config.json b/full_models/agu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agu/vocab.txt b/full_models/agu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c49027bc328668cc91d2dd5c6d7a5dc1a271e664 --- /dev/null +++ b/full_models/agu/vocab.txt @@ -0,0 +1,40 @@ +j +r +ó +b +é +s +t +v +g +i +x +k +f + +d +— +6 +y +z +c +h +u +m +p +a +ẍ +- +w +o +n +e +' +ꞌ +ñ +ú +í +á +_ +q +l diff --git a/full_models/agx/D_100000.pth b/full_models/agx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a7b450c01d0bf122185c2434be41901a0c3ee24 --- /dev/null +++ b/full_models/agx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2bfd1cbfe032dd0aa4f2361e8bd1a7c294b9a6702eacb2f8d1bf278c916f71 +size 561076023 diff --git a/full_models/agx/G_100000.pth b/full_models/agx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e126fef26e66fe7d8ae549099a5c3b0b98e7231d --- /dev/null +++ b/full_models/agx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:864a2ce8528d1b0ccd420a12d4e54931810222bdd1f140ad28e94d6360561083 +size 436349861 diff --git a/full_models/agx/config.json b/full_models/agx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/agx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/agx/vocab.txt b/full_models/agx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9d3f1c172babfb0e8abf8ef91f48c1b6b135f073 --- /dev/null +++ b/full_models/agx/vocab.txt @@ -0,0 +1,34 @@ +а +| +и +у +н +е +р +с +г +ь +к +д +л +х +ӏ +т +в +ъ +й +ч +я +м +б +п +ф +з +ш +э +ж +– +ц +ю +о + diff --git a/full_models/aha/D_100000.pth b/full_models/aha/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dd5a6e285d9a9eca4eb1d5efb767c722a01542ee --- /dev/null +++ b/full_models/aha/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e09112795fcc1f1d56cae41973badc5a0988c9c9816645c3387f7cba70ffc09 +size 561078329 diff --git a/full_models/aha/G_100000.pth b/full_models/aha/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82488ca0c9e33eb986fe909c6cf2bab0457375ae --- /dev/null +++ b/full_models/aha/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa5c360968d0561979edfef45f838489ecc1130b872db018c7277535374b44b +size 436397093 diff --git a/full_models/aha/config.json b/full_models/aha/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aha/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aha/vocab.txt b/full_models/aha/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dc236e9316bd8128d0f3a9b605c1dc0e71c2923e --- /dev/null +++ b/full_models/aha/vocab.txt @@ -0,0 +1,47 @@ +| +ɩ +n +a +ɛ +m +i +l +ɔ +y +b +ʋ +e +w +k +u +d +s +z +o +t +h +̃ +g +v +ɣ +p +f +á +ĩ +ã +́ +í +é +ũ +0 +ó +' +ú +1 +2 +5 +4 +6 +3 +7 + diff --git a/full_models/ahk/D_100000.pth b/full_models/ahk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d4f22166d3099b88e3d0c84d4ddc3760fbdf0cc2 --- /dev/null +++ b/full_models/ahk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b813c744ce748161f35cbed36655e05358e3c5b3be27053cc9faf2f7b140b787 +size 561076191 diff --git a/full_models/ahk/G_100000.pth b/full_models/ahk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e52de23077375b9c6862c6c18b5d7b258d5880af --- /dev/null +++ b/full_models/ahk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0536aa9fb28cd98aed15737c37068e509d26d61f867c16ae036e12f6fe59527 +size 436342089 diff --git a/full_models/ahk/config.json b/full_models/ahk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ahk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ahk/vocab.txt b/full_models/ahk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cf8112899696e4294a029010d68899b309132025 --- /dev/null +++ b/full_models/ahk/vocab.txt @@ -0,0 +1,30 @@ +| +a +ˬ +e +h +u +- +w +m +i +̭ +n +y +' +l +g +d +s +k +t +o +ˆ +j +b +p +z +c +` +f + diff --git a/full_models/aia/D_100000.pth b/full_models/aia/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f1e5667d63ffda35e4c1d993715acd0b3180c3d6 --- /dev/null +++ b/full_models/aia/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f27cdf91972ff460b4ce4c9fdd6b791e5bf1bb458f8448f1b9aff31079e75b75 +size 561098185 diff --git a/full_models/aia/G_100000.pth b/full_models/aia/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2d82106df001072878ccac74b87082bda5d2c30f --- /dev/null +++ b/full_models/aia/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a47a4387c822eb3eb3fabb8faedf55c16c9f11f0e0764627c3227f55726eb81 +size 436515009 diff --git a/full_models/aia/config.json b/full_models/aia/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aia/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aia/vocab.txt b/full_models/aia/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..112d50bb3e5421c07bd690138eaf447cd251f603 --- /dev/null +++ b/full_models/aia/vocab.txt @@ -0,0 +1,29 @@ +d +j +a +t +c +y + +m +g +v +6 +_ +b +u +e +w +- +h +p +ꞌ +r +f +s +l +n +o +— +i +k diff --git a/full_models/aka/D_100000.pth b/full_models/aka/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be89d073ed3384ff4e3c6c39dc3ac2a66a9eee35 --- /dev/null +++ b/full_models/aka/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb7917fdf8de5e517a7832cc0b1be116755c6618f17c8eaa7d065b81b42e642 +size 561098185 diff --git a/full_models/aka/G_100000.pth b/full_models/aka/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3eeb2d5ff46232668e2a57a0ca0e336532d8062b --- /dev/null +++ b/full_models/aka/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3b8551f70d75147bdd401369ae9b6fd532a21113232b6881610bfa04528ae7 +size 436517313 diff --git a/full_models/aka/config.json b/full_models/aka/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aka/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aka/vocab.txt b/full_models/aka/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1acf3892d40041550f0dfb085f24afcde0768cbb --- /dev/null +++ b/full_models/aka/vocab.txt @@ -0,0 +1,30 @@ +a +ʼ +t +- +n +' +_ +3 + +p +m +á +w +y +ɛ +f +o +g +u +k +h +l +s +2 +e +r +i +ɔ +d +b diff --git a/full_models/akb/D_100000.pth b/full_models/akb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..811c28b66597c6d88828697ce7b2f783ae7606fc --- /dev/null +++ b/full_models/akb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d9e3b79fd05b6fcd721a40178851c0b988377976931bd40c54f6109cf29bf0 +size 561098185 diff --git a/full_models/akb/G_100000.pth b/full_models/akb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b77a60c6117d0905e5bcd47600b8d8f40b44e055 --- /dev/null +++ b/full_models/akb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181f47d37ce569d9082d1fd873336da29cf41a9791a6826ee91eac33984df712 +size 436526529 diff --git a/full_models/akb/config.json b/full_models/akb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/akb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/akb/vocab.txt b/full_models/akb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4c804c545e6ca6e7738a9cdad85f43358d73b231 --- /dev/null +++ b/full_models/akb/vocab.txt @@ -0,0 +1,34 @@ +4 +g +n +l +k +w +0 +r +j +1 + +s +i +5 +u +z +v +b +- +' +2 +h +p +e +d +t +m +y +_ +a +c +f +6 +o diff --git a/full_models/ake/D_100000.pth b/full_models/ake/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0bb0d98fcbe16d25b865136dfcc5a436007a54a1 --- /dev/null +++ b/full_models/ake/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6429799472b0ce9428ef77c0e9db4e4bd6ec9aa9d76397e73af8caa90c98501 +size 561098185 diff --git a/full_models/ake/G_100000.pth b/full_models/ake/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a19cd1989bc66f6ddb182ba6fb9a2ebbc87c99e1 --- /dev/null +++ b/full_models/ake/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d349d1834df9a613aacaafe9e1b9d3777d165e6c651ba9bd67bc0fceb13b834b +size 436521921 diff --git a/full_models/ake/config.json b/full_models/ake/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ake/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ake/vocab.txt b/full_models/ake/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b891524633a9322b1c586fa2d934558abdcaae8b --- /dev/null +++ b/full_models/ake/vocab.txt @@ -0,0 +1,32 @@ +– +y +w +1 +k +7 +ɨ + +r +0 +_ +p +n +8 +9 +t +u +' +s +i +3 +- +a +5 +6 +o +e +4 +ʉ +— +m +2 diff --git a/full_models/akp/D_100000.pth b/full_models/akp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b3579b110b25c677c5818f6ac1b97c67847402f8 --- /dev/null +++ b/full_models/akp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3208b85cc559ba8b8e109d91dd4a4867e21c1f2a9a734f33fb88e9916b21faeb +size 561098185 diff --git a/full_models/akp/G_100000.pth b/full_models/akp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6107f4e8a5dffa9339222652467bb53b62058a8a --- /dev/null +++ b/full_models/akp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8028de805837c343e5479997896b17f815377869174d7015598053dbfb31621a +size 436528833 diff --git a/full_models/akp/config.json b/full_models/akp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/akp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/akp/vocab.txt b/full_models/akp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0628e29ad981378df423612d210d722ae1d36b23 --- /dev/null +++ b/full_models/akp/vocab.txt @@ -0,0 +1,35 @@ +t +' +ɖ +h +- +r +n +p +ɣ +a +l +v +ɛ +g +ã +o +z +m +i +d +w +f +ɔ +ĩ +s +u +6 +b + +̃ +ũ +e +y +k +_ diff --git a/full_models/alj/D_100000.pth b/full_models/alj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe23aef169106907e80d272263b0119bf7275e0b --- /dev/null +++ b/full_models/alj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b659fee053e0d9533613135c39c4784e7820e73d0e77d9efd6945f797263e0d +size 561078742 diff --git a/full_models/alj/G_100000.pth b/full_models/alj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0eea449380142b83bda3ea7723272b34309569df --- /dev/null +++ b/full_models/alj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc8fb4b7749a3d6e734fafbeb4046e333de54105c23e064abf70a43d186fcd66 +size 436350347 diff --git a/full_models/alj/config.json b/full_models/alj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/alj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/alj/vocab.txt b/full_models/alj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d36ec1f02a68f4cd113cae00aa88d92d77233c61 --- /dev/null +++ b/full_models/alj/vocab.txt @@ -0,0 +1,25 @@ +a +| +n +i +o +g +y +k +s +t +m +p +e +b +w +l +d +r +0 +4 +1 +5 +3 +ɩ + diff --git a/full_models/alp/D_100000.pth b/full_models/alp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..52610014d2628d2a4ad886b9c86bc12079b7dfe2 --- /dev/null +++ b/full_models/alp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ab8dd11340d3a58f25105136bfce9eb95bf698242b17900cfba472b5d9401da +size 561098185 diff --git a/full_models/alp/G_100000.pth b/full_models/alp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c9b8a6af615693e7d8741d1c74be5533c05c5c7 --- /dev/null +++ b/full_models/alp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aae1d533d0e216e8b8368f88ac021b7576c36ff043f91cc838c8d484fa1f7d91 +size 436517313 diff --git a/full_models/alp/config.json b/full_models/alp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/alp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/alp/vocab.txt b/full_models/alp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f12d463b3d6c1f9a35aeb6548c973b70c835c5da --- /dev/null +++ b/full_models/alp/vocab.txt @@ -0,0 +1,30 @@ +j +- +y +1 +c +' +_ +r +e +t +u +b +g +w +l +i +o +2 +f +4 +s +h +n +m +k +a +0 + +p +d diff --git a/full_models/alt/D_100000.pth b/full_models/alt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f9eaad45ed7409e67f23d8c33e127b596ac570f6 --- /dev/null +++ b/full_models/alt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de61999149b5dff341a9783af241bb5186bfb60e9386974953abf12049894e77 +size 561078756 diff --git a/full_models/alt/G_100000.pth b/full_models/alt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b05d2cb562f07f909f0924b57fcd62649b1c0e2 --- /dev/null +++ b/full_models/alt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ae6da9e961b8061d6cb60ce76bf7e1e5b72316a0894a0f0b9a1d325d439d24 +size 436397483 diff --git a/full_models/alt/config.json b/full_models/alt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/alt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/alt/vocab.txt b/full_models/alt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..60774c5cf6765a3326c036c4027166498a2d9e80 --- /dev/null +++ b/full_models/alt/vocab.txt @@ -0,0 +1,46 @@ +| +а +е +р +ы +н +л +и +к +д +о +т +у +г +б +с +й +п +ј +ӱ +ҥ +м +ч +з +ӧ +ж +ш +э +– +- +в +х +ф +я +ь +1 +2 +ц +ю +ÿ +4 +r +j +6 +0 + diff --git a/full_models/alz/D_100000.pth b/full_models/alz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f298f90aec709b4e949f21bce38024a57d5be14b --- /dev/null +++ b/full_models/alz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524f394898e2b1b94c729fb1bc853b27fa3718a8b727dab8e829d8cf23657563 +size 561078859 diff --git a/full_models/alz/G_100000.pth b/full_models/alz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..38493993864d614735e923e0e2d090d8dee4d1d9 --- /dev/null +++ b/full_models/alz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aadb692689fcb178e990062b9c28b1c813f14cbd634b8aba222732e063e7b075 +size 436358081 diff --git a/full_models/alz/config.json b/full_models/alz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/alz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/alz/vocab.txt b/full_models/alz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ce9a6b346785f479f11553eca17391b47697d75c --- /dev/null +++ b/full_models/alz/vocab.txt @@ -0,0 +1,27 @@ +| +a +i +e +n +u +o +m +k +g +d +w +r +t +b +c +y +l +' +h +p +j +s +f +v +z + diff --git a/full_models/ame/D_100000.pth b/full_models/ame/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d330b877fab0aa246c2813188ba98c998c5b921d --- /dev/null +++ b/full_models/ame/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d5951b6a4c6524d33140a153ebf43daa5b1f6de4db1a07fa51c5a6006ea853 +size 561098185 diff --git a/full_models/ame/G_100000.pth b/full_models/ame/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a7b8bc7407ad956a87d5af62ff5ecc243cc16abd --- /dev/null +++ b/full_models/ame/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bb7b0f8b40b3dbd796c46190da9bcab2612f80d7c98b68485a313fba04ba718 +size 436538049 diff --git a/full_models/ame/config.json b/full_models/ame/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ame/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ame/vocab.txt b/full_models/ame/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d2cdc86492abb2ff429c3a907773efb4632a8c2 --- /dev/null +++ b/full_models/ame/vocab.txt @@ -0,0 +1,39 @@ +í +x +i +_ +b +v +y +w +q +n + +p +ë +u +j +ú +ñ +g +r +s +é +t +d +z +c +- +e +a +k +h +ó +o +á +f +— +2 +l +m +' diff --git a/full_models/amf/D_100000.pth b/full_models/amf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1808b7724ad5069375fc5952cca65811eb730a36 --- /dev/null +++ b/full_models/amf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7c7492f7f73872779b8475db9ece5195987b3a95a2ee2bfcc25cefeddfca0d +size 561098185 diff --git a/full_models/amf/G_100000.pth b/full_models/amf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f654f45069cf9642bb01c2d918b2550998272146 --- /dev/null +++ b/full_models/amf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68d6548dacba668fd3093c017a50df5168e6b9eac7af10f9846567d42fdfa81 +size 436512705 diff --git a/full_models/amf/config.json b/full_models/amf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/amf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/amf/vocab.txt b/full_models/amf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5f1d3e54a3120d2c6003570da9230c45a635bd0e --- /dev/null +++ b/full_models/amf/vocab.txt @@ -0,0 +1,28 @@ +z +k +v +a +n +u +x +l +j +p +w +g +h +t +_ +m +s +c +e +y +o + +i +q +r +' +d +b diff --git a/full_models/amh/D_100000.pth b/full_models/amh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c6fbc9ec25aa0dee23315d56d7d9e2164437d15 --- /dev/null +++ b/full_models/amh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaffc510b505022f64ef7e447d883a5e3fd9717295460b45caeaa81e1e415951 +size 561110607 diff --git a/full_models/amh/G_100000.pth b/full_models/amh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81740854fbacd6306ecadcbfa38b3c85c5ae0e1a --- /dev/null +++ b/full_models/amh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:290df5a11be019a427cefca18cd3bea4b644a8788e61fb6adb06f2377d9db0e4 +size 436596679 diff --git a/full_models/amh/config.json b/full_models/amh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..993d1dedb1d0c8e820b98f9e2f019ff166327038 --- /dev/null +++ b/full_models/amh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.uroman", + "validation_files": "dev.uroman", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/amh/vocab.txt b/full_models/amh/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..59fcb3668654565a9b6ddde9b45e26d542af6e45 --- /dev/null +++ b/full_models/amh/vocab.txt @@ -0,0 +1,28 @@ +c +_ +l +f +p +e +m +j +r +h +o +z + +s +' +t +n +u +q +b +w +a +k +x +i +y +d +g diff --git a/full_models/ami/D_100000.pth b/full_models/ami/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5f49201c06ce2dd6dcf6e82a970ebd4c8337e36e --- /dev/null +++ b/full_models/ami/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d023f0b4ca877caf8f85218b5c7f5a1a3c3145d2a7f882358c7ed5cc8062b7 +size 561110531 diff --git a/full_models/ami/G_100000.pth b/full_models/ami/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b111ef6930255f4ec367242c68c0b7611bf80f3c --- /dev/null +++ b/full_models/ami/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4c9c6c17600cad42f0657e4b2ab94b3ab5320fdb2f4bd16cea81f81f589bd61 +size 436591723 diff --git a/full_models/ami/config.json b/full_models/ami/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ami/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ami/vocab.txt b/full_models/ami/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4ed52000213ebf3db387d5fa31ef405dac98319b --- /dev/null +++ b/full_models/ami/vocab.txt @@ -0,0 +1,26 @@ +a +| +o +n +i +k +t +m +y +s +r +l +w +c +p +g +d +' +h +e +f +u +x +0 +- + diff --git a/full_models/amk/D_100000.pth b/full_models/amk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1e66aa65142d0cd73b7aecbc8902df6848bb6c4 --- /dev/null +++ b/full_models/amk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a086bd4cd95bb86e324d492a5aa60326e11052472c3d8a8e6b0c39fdfff6eaf +size 561098185 diff --git a/full_models/amk/G_100000.pth b/full_models/amk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d272ed55ce81677b1ab0148ebaba45eb79e7125b --- /dev/null +++ b/full_models/amk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3006bc9822cccdcb2e88d66bf895a14c0c859a091ebc0a7330b7a6a3e9f2edb +size 436528833 diff --git a/full_models/amk/config.json b/full_models/amk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/amk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/amk/vocab.txt b/full_models/amk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..498fec475f498ae2d7932d81028ceb6ae6afb89a --- /dev/null +++ b/full_models/amk/vocab.txt @@ -0,0 +1,35 @@ +h +z +e +o +2 +a +u +_ +- +j +' +g + +p +d +c +l +0 +t +w +3 +— +6 +y +k +f +m +i +1 +b +7 +n +r +4 +s diff --git a/full_models/ann/D_100000.pth b/full_models/ann/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2f019fb804bd85a3751d1a1559427de701bb77d --- /dev/null +++ b/full_models/ann/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f14c7a382f3ed9b95c8d6f9d0c4fc694aa30c6fc0794e7b12776e25b39d3a900 +size 561078598 diff --git a/full_models/ann/G_100000.pth b/full_models/ann/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..136516793fcf3319860b2078de90ce2eda4dafaa --- /dev/null +++ b/full_models/ann/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f268aa5d3254092da8e36de45bbc014c6af8425029d2e5177209fb82e244aa18 +size 436382891 diff --git a/full_models/ann/config.json b/full_models/ann/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ann/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ann/vocab.txt b/full_models/ann/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a588477c29ffa1d306ed19e931821c36ef061c9a --- /dev/null +++ b/full_models/ann/vocab.txt @@ -0,0 +1,40 @@ +| +e +i +a +n +k +u +m +ọ +b +o +t +̄ +y +g +r +w +s +j +l +p +è +ì +h +c +f +ò +î +d +- +ô +ǹ +ê +â +̀ +à +ù +' +û + diff --git a/full_models/any/D_100000.pth b/full_models/any/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0f7798539882e1a05aa6d4faeef9c1eab9f925a7 --- /dev/null +++ b/full_models/any/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a084bfc5cdf99abad573b1c3b48654b40a90dd7c327e2850945d16a1602c3f0 +size 561098185 diff --git a/full_models/any/G_100000.pth b/full_models/any/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57eaa5f3db28035d65e8d7f264673e7b255e5410 --- /dev/null +++ b/full_models/any/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23705518fdbf36e917b21b417795f7f136620fbecb326f31cf217fca97342377 +size 436538049 diff --git a/full_models/any/config.json b/full_models/any/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/any/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/any/vocab.txt b/full_models/any/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..251a714a2366b265af343d88bad4b52f4a942557 --- /dev/null +++ b/full_models/any/vocab.txt @@ -0,0 +1,39 @@ +ʋ +í +m +ó +a +t +u +ɛ +̂ +ú +c +ɔ +' +́ +á +_ +l +d +y +p +b +é +g +n +j +v +â +s +f +e + +k +ɩ +i +z +o +- +w +h diff --git a/full_models/aoz/D_100000.pth b/full_models/aoz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e9eae8658556cd575da2d848f43adf2e2990489 --- /dev/null +++ b/full_models/aoz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4913ed82f28a36ebc0629e85625de0e6c398fe9d4f5961e237ac55c69a541e0f +size 561076032 diff --git a/full_models/aoz/G_100000.pth b/full_models/aoz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa02539e25cf4cd68e5357b63337a9bab9899428 --- /dev/null +++ b/full_models/aoz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb57a682be3e66a57976fbfd1c54624d1c6c8d1d507bfb06a8e8e3a8d909294 +size 436326748 diff --git a/full_models/aoz/config.json b/full_models/aoz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/aoz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/aoz/vocab.txt b/full_models/aoz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..422e66602b282d6637fb9c05dcd9ea13af1ad52d --- /dev/null +++ b/full_models/aoz/vocab.txt @@ -0,0 +1,24 @@ +| +a +n +i +e +s +u +o +m +l +t +k +' +h +f +b +g +p +y +j +- +r +d + diff --git a/full_models/apb/D_100000.pth b/full_models/apb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..429e3fbec61fd9929c4036bf6191ed05ed466c8d --- /dev/null +++ b/full_models/apb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:085dddd2ee8a504d02c70953f6a3c51e9c36a034738117c09d99254c59978c6c +size 561076941 diff --git a/full_models/apb/G_100000.pth b/full_models/apb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5590dd2879a6073f0c8f93dc7c187183080f6e1 --- /dev/null +++ b/full_models/apb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42572e20086f1c1374cfc325a43040dadd3a8ac7ab724dab4c8016a4d871d14a +size 436378176 diff --git a/full_models/apb/config.json b/full_models/apb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/apb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/apb/vocab.txt b/full_models/apb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e2b8659c6bcc80042b78d1aa9a3c4d061eb1be7d --- /dev/null +++ b/full_models/apb/vocab.txt @@ -0,0 +1,38 @@ +| +a +e +i +o +n +u +l +m +ꞌ +k +h +t +r +g +s +w +d +p +- +j +b +1 +v +2 +3 +f +5 +4 +6 +8 +9 +0 +7 +— +' +z + diff --git a/full_models/apr/D_100000.pth b/full_models/apr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91eb2baf6b249ab8967604a7677373c824d4f5bc --- /dev/null +++ b/full_models/apr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b33bd2a1b532b191f630482e8e25361eb0c50214051bee927e285993674000d +size 561098185 diff --git a/full_models/apr/G_100000.pth b/full_models/apr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e6dd690d9067def9da7f6a1ded9e36568c33ab1b --- /dev/null +++ b/full_models/apr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0edbcbdc4fdc6b62e2cd543e61f4da1a74f8699e4325e9b0fd4c8106d8b4dd +size 436519617 diff --git a/full_models/apr/config.json b/full_models/apr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/apr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/apr/vocab.txt b/full_models/apr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..94dd9d7305656ddaf39af1864fb0b10c63186dc6 --- /dev/null +++ b/full_models/apr/vocab.txt @@ -0,0 +1,31 @@ +3 +n +y +r +9 +d +l +k +4 + +2 +6 +' +s +_ +a +1 +i +t +p +o +7 +w +5 +u +b +g +8 +e +0 +m diff --git a/full_models/ara/D_100000.pth b/full_models/ara/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..96b5db785da8ce14d5bd667b18415a0fba8e6aa2 --- /dev/null +++ b/full_models/ara/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de921c4d12276246985a3417a09fc3954dd01a0a7c030e94d4233d2516265070 +size 561110755 diff --git a/full_models/ara/G_100000.pth b/full_models/ara/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a44d03c660064d6029f5746878f590df23c0e5c5 --- /dev/null +++ b/full_models/ara/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efa6717dc90ad7db7895e17210a946d32297fd3b6ac42291f27eb7f333b5b7c +size 436623138 diff --git a/full_models/ara/config.json b/full_models/ara/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ara/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ara/vocab.txt b/full_models/ara/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..d1be48458cd2285ede825d5c2fc1efe5245d7ec3 --- /dev/null +++ b/full_models/ara/vocab.txt @@ -0,0 +1,39 @@ +ا +ن +ك +ع +إ +غ +ذ +ة +س +ر +ط +خ +ت +ج +ظ +ي +د +– +ص +ث +أ +ى +ض +ح +ه + +ء +آ +ب +و +م +ل +ش +ق +ز +ؤ +ف +_ +ئ diff --git a/full_models/arl/D_100000.pth b/full_models/arl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..96ceb14d31b26567eeb5f97d9ed8e75c9bdd0b10 --- /dev/null +++ b/full_models/arl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616fce371e6b73243b09ca00ac310f38332394a355f08244cba098b1e8e85aaa +size 561098185 diff --git a/full_models/arl/G_100000.pth b/full_models/arl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..717c8ae9f33168beb6a1838b4f9fc5c84a0f384e --- /dev/null +++ b/full_models/arl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee2a733df767e297f8d726ed1bb608db38baca3038a4693ed81aaca8441f43a8 +size 436526529 diff --git a/full_models/arl/config.json b/full_models/arl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/arl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/arl/vocab.txt b/full_models/arl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cbd23864925a1e9d45edb4708d97646031e02df3 --- /dev/null +++ b/full_models/arl/vocab.txt @@ -0,0 +1,34 @@ +d +i +n +x +o +v +s +' +h +é +r +e +y +b +g +t +k + +ó +_ +l +í +c +á +a +— +q +u +z +ú +f +j +p +m diff --git a/full_models/asa/D_100000.pth b/full_models/asa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d612ddf19953c115501dc7e243c7f08b21c6a86c --- /dev/null +++ b/full_models/asa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ae94f65de979c76df87393a7ebd5e57eb3497a0b8b681409b481328d27d61b +size 561098185 diff --git a/full_models/asa/G_100000.pth b/full_models/asa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a92c064a5923be2c39c26de5db7afbc2f629d0f3 --- /dev/null +++ b/full_models/asa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc59e64fa40c7516e5876b2490c70db4c9d472ed90c99883f44e42790b78d716 +size 436512705 diff --git a/full_models/asa/config.json b/full_models/asa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/asa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/asa/vocab.txt b/full_models/asa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..496448d2f597d7247eed9f59390e8ab8c03e85d1 --- /dev/null +++ b/full_models/asa/vocab.txt @@ -0,0 +1,28 @@ +z +m +w +_ +- +p +b +t +e +y + +i +f +a +c +u +n +o +l +v +r +g +j +s +k +d +h +' diff --git a/full_models/asg/D_100000.pth b/full_models/asg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b08461fd277174afc0eb35e5aa4ca5fd724652fb --- /dev/null +++ b/full_models/asg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33b4042849a646bfe671fae1c5141f5d8d40650b839e933d19ba29907210f48 +size 561078065 diff --git a/full_models/asg/G_100000.pth b/full_models/asg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f0f7d740919de08bf93f17fb7a5e64f2942035e4 --- /dev/null +++ b/full_models/asg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953a601a66fbbec550a5c1f60bc0efc9d5fd32861b60097813634d18567ef9ba +size 436358080 diff --git a/full_models/asg/config.json b/full_models/asg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/asg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/asg/vocab.txt b/full_models/asg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e4b15fdec3f0b61d90e9b02d11b55c967309568e --- /dev/null +++ b/full_models/asg/vocab.txt @@ -0,0 +1,32 @@ +| +a +i +u +n +k +̱ +e +m +s +t +o +y +l +ɗ +b +g +v +d +h +w +p +c +ꞌ +z +r +f +ɓ +j +- +' + diff --git a/full_models/asm/D_100000.pth b/full_models/asm/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..29053cc07b22bde43eff0b6b49ef38ad5b1c4940 --- /dev/null +++ b/full_models/asm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4269ed32d44b9d30271a49caf3fd97f5e6d386198abf97c959e6577343763cda +size 561079135 diff --git a/full_models/asm/G_100000.pth b/full_models/asm/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..667f88e4286f97e44a17b9de81e9442b00c079a0 --- /dev/null +++ b/full_models/asm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ad2b61a92e6857438064b6a2c21d4f7d252fc5bf99afaa02adf969eef511af +size 436445810 diff --git a/full_models/asm/config.json b/full_models/asm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/asm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/asm/vocab.txt b/full_models/asm/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..57faf47a6b7be879f615c4c89e59e2a2ae1a9240 --- /dev/null +++ b/full_models/asm/vocab.txt @@ -0,0 +1,66 @@ +| +ৰ +া +ক +ে +ি +ত +ন +্ +ল +ো +য +ব +প +ম +ু +স +আ +হ +় +ই +দ +ঁ +ও +জ +ী +শ +চ +ৈ +গ +ৱ +ছ +এ +ধ +থ +ষ +ভ +অ +ণ +খ +' +ট +র +ূ +ঈ +উ +ৃ +- +ঠ +ঘ +ফ +ং +ঞ +ড +ৌ +ৎ +ঙ +ঢ +ঃ +ঐ +ঋ +0 +2 +— +‍ + diff --git a/full_models/ata/D_100000.pth b/full_models/ata/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..efae77aa0080aba9329524194642384425d135e2 --- /dev/null +++ b/full_models/ata/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b15ae3b5148230079187eede85a9dab464b5a1c864249e735bce1819808b49f +size 561098185 diff --git a/full_models/ata/G_100000.pth b/full_models/ata/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2936e1613fd32d987cc16714c3c1894232010cf9 --- /dev/null +++ b/full_models/ata/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b7cbd602d5128b5fc4fbfda70b5bf0c9739588521e2d66b90152827fc818306 +size 436524225 diff --git a/full_models/ata/config.json b/full_models/ata/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ata/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ata/vocab.txt b/full_models/ata/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d8ea470aba46f88ec12765479c5b2e39768a0990 --- /dev/null +++ b/full_models/ata/vocab.txt @@ -0,0 +1,33 @@ +' +i +7 +u +v +_ +b +p +z +d +r +1 +f +– +o +h +g +t +0 + +a +k +- +6 +m +4 +l +2 +5 +e +n +s +x diff --git a/full_models/atb/D_100000.pth b/full_models/atb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bbd3f848fa6656cfe52afc266bcb014ee895f5b --- /dev/null +++ b/full_models/atb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895874c28a12b0879d6209ffef7df15ea957f5cd3128e610fe079aa63e0ced5e +size 561098185 diff --git a/full_models/atb/G_100000.pth b/full_models/atb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd6f20bdf3633127515618a31428e2745e284d85 --- /dev/null +++ b/full_models/atb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f0c19f1fad38151bd874129a1bfd878730361d65409e14b3adeb03d083bd86 +size 436563393 diff --git a/full_models/atb/config.json b/full_models/atb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/atb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/atb/vocab.txt b/full_models/atb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..acb63a02994a9540912a14ab0a2b3e1a2a6ccfdf --- /dev/null +++ b/full_models/atb/vocab.txt @@ -0,0 +1,50 @@ +_ +s +c +î +4 +z +ò +q +à +ù +- +0 +x +ê +o +u +' +ú +n +k +r +w +‐ +é +j +è +y +g +a +á +ô +i +b +h +m +e +t +8 +l +6 +í +p +ó +1 +ì +û + +d +â +2 diff --git a/full_models/atg/D_100000.pth b/full_models/atg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4621e677472726b1471dc548b2da0088eae38dfe --- /dev/null +++ b/full_models/atg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b67361284137af465421cc8fc21e0f877ef9bdbf94190cb78a669cbecd566e +size 561098185 diff --git a/full_models/atg/G_100000.pth b/full_models/atg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d455d22f0ecc1273f37c8482590dbcc701e857e3 --- /dev/null +++ b/full_models/atg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6eee79ed6367fc3914d786f9587385e75cbd7d8a6f0ee41e2995f8b7dd46480 +size 436563393 diff --git a/full_models/atg/config.json b/full_models/atg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/atg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/atg/vocab.txt b/full_models/atg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1b7f8244ca525f531afa8ae22f7a766380846fa1 --- /dev/null +++ b/full_models/atg/vocab.txt @@ -0,0 +1,50 @@ +g +l +y +b +h +v +1 +d +z +o +̀ +4 +_ +ú +t + +i +ó +0 +s +á +3 +ò +̌ +m +w +p +̄ +u +ọ +é +7 +ẹ +́ +k +a +n +- +ā +2 +è +f +à +6 +e +j +c +r +' +ù diff --git a/full_models/ati/D_100000.pth b/full_models/ati/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..15ab3115dd2a7ad62909bec8e5f3ba3f60cc74c8 --- /dev/null +++ b/full_models/ati/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4f0483443cad56fdcedd16ea7c633ee832eeeb055f762a0c30c6091b02e6f6 +size 561078976 diff --git a/full_models/ati/G_100000.pth b/full_models/ati/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2b522afc92b02e53b75118e4e340127d5d47a5d --- /dev/null +++ b/full_models/ati/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01008e43083bc0f48e9a90bc46af1051878d8d21158e2d9f769d91779c64f84b +size 436365592 diff --git a/full_models/ati/config.json b/full_models/ati/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ati/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ati/vocab.txt b/full_models/ati/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7977571010ec658116138ab86298be0ff43b4b63 --- /dev/null +++ b/full_models/ati/vocab.txt @@ -0,0 +1,31 @@ +| +' +n +a +ɛ +i +k +e +b +u +ɔ +h +m +s +l +ö +z +y +o +p +ë +t +f +d +w +g +r +j +v +c + diff --git a/full_models/atq/D_100000.pth b/full_models/atq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f342d5fe641dec45e965b0c34dce21a0574d03f3 --- /dev/null +++ b/full_models/atq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e523443d7cae9bf04bf5e141cb200338eba41a1fbedae72c75d2d0154252c2cf +size 561098185 diff --git a/full_models/atq/G_100000.pth b/full_models/atq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b81bd44bd2254c8b91e6b6fa66877ba4e09424e3 --- /dev/null +++ b/full_models/atq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ad90b7a004e72003e45ac6dcb298336605bf021e3bb32255cc5c9365201edc0 +size 436512705 diff --git a/full_models/atq/config.json b/full_models/atq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/atq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/atq/vocab.txt b/full_models/atq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1717dc76394e3258d064db34d4c53f84ee4c990d --- /dev/null +++ b/full_models/atq/vocab.txt @@ -0,0 +1,28 @@ +l +w +o +n +a +' +r +j +b +d +m +f +p +c +e +- +k +u +i +s +_ +y + +g +h +ä +z +t diff --git a/full_models/ava/D_100000.pth b/full_models/ava/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7e1e6c678b8a55ddfa2aac6dd45c5c5b493133e9 --- /dev/null +++ b/full_models/ava/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d39a795c094415cb3c0ad4a12a7892bfe06537f5e5809d8287e1b91f9456d54 +size 561098185 diff --git a/full_models/ava/G_100000.pth b/full_models/ava/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d28dfaaf4064afa10521ff8a4e38d624e5fe8ed5 --- /dev/null +++ b/full_models/ava/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e313bbdab0702807a4ddba7d1ca413f8422a0d722b3cb52479d40dbb4090f90e +size 436533441 diff --git a/full_models/ava/config.json b/full_models/ava/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ava/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ava/vocab.txt b/full_models/ava/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c2e20ffd8cb6856b8fa3cea6e62625fd286af853 --- /dev/null +++ b/full_models/ava/vocab.txt @@ -0,0 +1,37 @@ +о +н +п +х +- +з +ъ +э +ж +ю +ӏ +м +л +д +я +б +г +с +у +ь +_ +е +– +й +в +ч +ф +щ +ё +т +и +к +ш + +а +р +ц diff --git a/full_models/avn/D_100000.pth b/full_models/avn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5b983b482c975a846e32e682511bac8df5ca6ebe --- /dev/null +++ b/full_models/avn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40c006e3c862d6f9c8438c4e87184b2f8e1b10e0a8738858ac3bb2605d04330 +size 561098185 diff --git a/full_models/avn/G_100000.pth b/full_models/avn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af37dda865af0d79d92a36081cf13fdef8ce06a1 --- /dev/null +++ b/full_models/avn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecfda39f7f68c21e69de6d56d24e218bc6038cab5a575e0d1311454b4af1d3c +size 436561089 diff --git a/full_models/avn/config.json b/full_models/avn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/avn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/avn/vocab.txt b/full_models/avn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..75cc584b7fc802a5bdc9fee65a1adf0fffae0d77 --- /dev/null +++ b/full_models/avn/vocab.txt @@ -0,0 +1,49 @@ +x +d +i +í +ʋ +s +á +y +̀ +w +o +ũ +k +' +ɛ +é +u +r +ƒ +e +ò +ú +m +t +n +h +ì +ù +è +ɖ +ŋ +ɔ +z +g +́ +à +c +_ +v +l +p +f +ĩ +b +ó +ã + +a +̃ diff --git a/full_models/avu/D_100000.pth b/full_models/avu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..16210ceb2579d23fa142749d9c280eebcf8cee6f --- /dev/null +++ b/full_models/avu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe382c662693272aeb702e98a443f4e3c0f3fb3145a001c5e893aff984b0bcfa +size 561076180 diff --git a/full_models/avu/G_100000.pth b/full_models/avu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce0fd3b8fb3b78cf7dccc63de381a08353b6d7a1 --- /dev/null +++ b/full_models/avu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22cf1fa2c0f44dbe2e2ed51cc15556f7db9a6f382f8402b0e07ce0849c714f13 +size 436404160 diff --git a/full_models/avu/config.json b/full_models/avu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/avu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/avu/vocab.txt b/full_models/avu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ba780cad86f4280332f47d8403796e69d11548c2 --- /dev/null +++ b/full_models/avu/vocab.txt @@ -0,0 +1,57 @@ +| +r +ʼ +á +ã +l +â +d +î +ĩ +í +n +t +ó +õ +g +y +b +k +ị +é +ô +s +m +̃ +z +́ +ẽ +j +v +ê +ạ +ú +ũ +p +̂ +- +f +û +c +ậ +w +ṇ +' +1 +2 +h +4 +3 +5 +8 +6 +9 +0 +7 +i + diff --git a/full_models/awa/D_100000.pth b/full_models/awa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fca76c9c1331c0cf9fc0dc6dded611bd4c09759b --- /dev/null +++ b/full_models/awa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9315300f22a3a805e6b0f8dc09335bfec998067d62720029e0712242cc7eba6b +size 561078847 diff --git a/full_models/awa/G_100000.pth b/full_models/awa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d91a7f7a46f4c55b29bda9cf537cc685f34d556c --- /dev/null +++ b/full_models/awa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d62a9ee9568c14572d146b0ebd2e65b474b29ad0de23c46b95bb91999246787 +size 436474239 diff --git a/full_models/awa/config.json b/full_models/awa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/awa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/awa/vocab.txt b/full_models/awa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8a41754d812d6fbc79f2bcf79141b0a5dc9f03df --- /dev/null +++ b/full_models/awa/vocab.txt @@ -0,0 +1,78 @@ +| +ा +क +र +ह +न +स +े +त +म +ि +इ +उ +ब +प +् +ी +अ +ज +ल +ो +ँ +व +द +य +ू +ु +ग +च +ओ +ं +आ +भ +ख +ए +ई +ट +ध +छ +ड +़ +फ +थ +ठ +ण +ौ +घ +ढ +झ +ै +ऊ +ऍ +- +ृ +ऩ +ॅ +ञ +ः +ॉ +' +0 +ष +ऐ +श +1 +2 +औ +ऋ +6 +4 +9 +ऎ +7 +ऱ +i +3 +5 + diff --git a/full_models/awb/D_100000.pth b/full_models/awb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c50bde709ba9e2939b8e227a4bbbee1dae6cf322 --- /dev/null +++ b/full_models/awb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a751b238c5ef3d0c56bfb476993d311d025f185f3ae40b3b7cab402805b65341 +size 561078507 diff --git a/full_models/awb/G_100000.pth b/full_models/awb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c766f83e6d4c797531b4b42d43c081b735e38f9a --- /dev/null +++ b/full_models/awb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621913cd488e7a8c469e4777ae986c4605f3cda49f9fc64955654d0be635f891 +size 436371390 diff --git a/full_models/awb/config.json b/full_models/awb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/awb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/awb/vocab.txt b/full_models/awb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ebab784d722469643f9e56902497b1e272e4017d --- /dev/null +++ b/full_models/awb/vocab.txt @@ -0,0 +1,35 @@ +| +a +e +n +r +h +i +á +w +é +í +m +k +t +s +q +o +b +u +g +p +ó +ú +y +0 +1 +2 +4 +5 +3 +7 +6 +8 +9 + diff --git a/full_models/ayo/D_100000.pth b/full_models/ayo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e730ba32a8f03e964d9c751de33983179cd77e0f --- /dev/null +++ b/full_models/ayo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ed4ae1f15a4a48e45552ede00c654fa179e250a6b22634d76f430d5874bfc34 +size 561098185 diff --git a/full_models/ayo/G_100000.pth b/full_models/ayo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c1ac0942a009298237ddb94ad6573a86a75b3949 --- /dev/null +++ b/full_models/ayo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7969d0e86fe65b86fd4bb9cec83b5501a1f6042b8ea48e07f381c29e78bdf21 +size 436579521 diff --git a/full_models/ayo/config.json b/full_models/ayo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ayo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ayo/vocab.txt b/full_models/ayo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6f8e7ef9165ebaf84590c95dcb3f98cccf625c74 --- /dev/null +++ b/full_models/ayo/vocab.txt @@ -0,0 +1,57 @@ +0 +c +z +ñ +j + +ẽ +v +a +ṍ +q +4 +ó +­ +2 +_ +̃ +õ +7 +y +6 +o +í +ã +b +- +t +s +ú +́ +– +u +1 +g +r +d +3 +ṹ +5 +x +9 +p +l +k +m +n +e +ũ +8 +h +ı +é +á +i +f +ĩ +' diff --git a/full_models/ayr/D_100000.pth b/full_models/ayr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dd6351bc280999c58fa7fa9f9ba4ae3d4b2e86a0 --- /dev/null +++ b/full_models/ayr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20da2c9c65833befb24678df0356e73e5698e938457ba0676aadc2a2e17a70a +size 561078877 diff --git a/full_models/ayr/G_100000.pth b/full_models/ayr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bc75db6e1ac30180a087c889784cc9115fe06589 --- /dev/null +++ b/full_models/ayr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88b894654aff3d12bbdfe719cbd75423c67fae29a5adcc64d51e8f32d877984 +size 436388174 diff --git a/full_models/ayr/config.json b/full_models/ayr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ayr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ayr/vocab.txt b/full_models/ayr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24edecfac0881010517777e4720e0545e19ee73a --- /dev/null +++ b/full_models/ayr/vocab.txt @@ -0,0 +1,41 @@ +a +| +i +t +k +n +u +s +p +r +m +j +x +h +w +y +q +c +l +ä +ñ +' +o +e +d +ï +— +b +g +f +ü +v +í +é +ó +z +á +ö +ú +ë + diff --git a/full_models/ayz/D_100000.pth b/full_models/ayz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9ffeb2474a18a907bc281e5b4daeaba1b0c10e34 --- /dev/null +++ b/full_models/ayz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784c975216b17180e2d646553a459b591db3a8cf052191e3699e33408e7047da +size 561098185 diff --git a/full_models/ayz/G_100000.pth b/full_models/ayz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d15e1de931d1cfbd9f866b9f8676bf5d17bceb7 --- /dev/null +++ b/full_models/ayz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6afd1afe7546d9a9ff120667719aeb1bead5f870c9cca1e4d8a7639b897e269f +size 436540353 diff --git a/full_models/ayz/config.json b/full_models/ayz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ayz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ayz/vocab.txt b/full_models/ayz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cee9ccd90bbfc03f6d8fc62c057fe618bc0bfbf2 --- /dev/null +++ b/full_models/ayz/vocab.txt @@ -0,0 +1,40 @@ +2 +a +f +9 +r +u +_ +m +d +5 +j +s +4 +7 +e +o +b + +p +6 +n +' +t +ʼ +y +i +l +z +- +g +c +h +0 +õ +v +1 +w +8 +3 +k diff --git a/full_models/azb/D_100000.pth b/full_models/azb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e408c2392f813ee9ec9827979ae2b34b762f4fba --- /dev/null +++ b/full_models/azb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d3dbfbac01becb1cf11e1ddcd61805e0415859407d1f55093619507c76ca1b +size 561098185 diff --git a/full_models/azb/G_100000.pth b/full_models/azb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a3f93b666b4004bbb312cb3839939ad21b3a979 --- /dev/null +++ b/full_models/azb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a36bfbaf14729a1f98576ca946efd05edfc24d7356342c738806d0002163f21 +size 436538049 diff --git a/full_models/azb/config.json b/full_models/azb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/azb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/azb/vocab.txt b/full_models/azb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..992cad17a241a9c5adf30b3b3194a20f0af4d72d --- /dev/null +++ b/full_models/azb/vocab.txt @@ -0,0 +1,39 @@ +ن +ت +- +ص +پ +ث +ه +گ +ح +ا +آ +ک +ع +أ +خ +س +م +ؤ +ل +و +ئ +ی +_ +ر +ژ +غ +ج +د +ظ +ذ +ب +ق +چ + +ط +ض +ش +ز +ف diff --git a/full_models/azg/D_100000.pth b/full_models/azg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c3826300d6b42081d79d0acad06c1666f18a347 --- /dev/null +++ b/full_models/azg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9daaa2ab2c7928a4fc7c1f97432927ab8096d8a54b465e5193e9a855b0c44f13 +size 561098185 diff --git a/full_models/azg/G_100000.pth b/full_models/azg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f1a52806e02fb4d8b3379f227821e8f2f856783 --- /dev/null +++ b/full_models/azg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5289fd28abfcc4299168f1decd7a27b1cfee82b0319560e7946ae36942f83421 +size 436538049 diff --git a/full_models/azg/config.json b/full_models/azg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/azg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/azg/vocab.txt b/full_models/azg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ed7f26052fe01dcf299a4b71e636b1602c9c6e68 --- /dev/null +++ b/full_models/azg/vocab.txt @@ -0,0 +1,39 @@ +ú +k +í +' +n +v +l +ö +_ +z +t +o +x +ñ +y +q +ü +s +ë +́ +— +é +a +u +e +g +m +j +c +ó +á +i +b +f + +p +r +h +d diff --git a/full_models/azj-script_cyrillic/D_100000.pth b/full_models/azj-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ec43f61e665f879541ec746c12a401e4d2eedfa6 --- /dev/null +++ b/full_models/azj-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2093c291cce64701d5807b936dbb736f4c621d6bb258f08441e691d850d39df2 +size 561078234 diff --git a/full_models/azj-script_cyrillic/G_100000.pth b/full_models/azj-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68a9e93c857a6cbf591bd650263182dee0b0ae21 --- /dev/null +++ b/full_models/azj-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ef0479a620ce28e826580c2e3c7b71776481f36886b251782385c19cbc6145 +size 436373147 diff --git a/full_models/azj-script_cyrillic/config.json b/full_models/azj-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/azj-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/azj-script_cyrillic/vocab.txt b/full_models/azj-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f2906cfe66d9f137a7c4de45b17925c07ef719de --- /dev/null +++ b/full_models/azj-script_cyrillic/vocab.txt @@ -0,0 +1,37 @@ +| +а +ж +и +н +р +л +д +э +м +с +ј +з +б +у +т +е +ь +о +к +г +һ +ю +в +ц +ҝ +х +ҹ +п +ф +- +– +0 +1 +2 +4 + diff --git a/full_models/azj-script_latin/D_100000.pth b/full_models/azj-script_latin/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f93cd2e1c2876e7c678c3ac940b1f1fa19993b4c --- /dev/null +++ b/full_models/azj-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28b30c8e85f550e8b6ab27bf2f3dfa26d2d8b4a43a317c5c71093a2fe21239b +size 561079351 diff --git a/full_models/azj-script_latin/G_100000.pth b/full_models/azj-script_latin/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..911d6d2b3566c78c4cf127f9dcc461302693a358 --- /dev/null +++ b/full_models/azj-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:558a397af2d25c42128884ba7879ee7ec1e0f0138bb3a20f845bb9d92dca7c2e +size 436393556 diff --git a/full_models/azj-script_latin/config.json b/full_models/azj-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/azj-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/azj-script_latin/vocab.txt b/full_models/azj-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0d31a4b2b2bbab44e0f0ce23c7fbc2957d210afd --- /dev/null +++ b/full_models/azj-script_latin/vocab.txt @@ -0,0 +1,42 @@ +1 +t +6 +s +ç + +ğ +_ +e +2 +ü +x +m +n +d +v +b +q +z +k +ö +0 +p +– +g +j +a +i +u +ş +c +l +ı +4 +̇ +o +ə +h +f +- +r +y diff --git a/full_models/azz/D_100000.pth b/full_models/azz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ea56f86fb99850285908278d1898d56743859b1 --- /dev/null +++ b/full_models/azz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255f628a3bbc3098a0c828257521a763e2fca8a17d946ace71ac1fa2554fa1bd +size 561076185 diff --git a/full_models/azz/G_100000.pth b/full_models/azz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aad506a75c06a27ccd4965faf391e0fb25e70559 --- /dev/null +++ b/full_models/azz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4d13e6f6ddb532780adbc74532624ffe3389b648d32a291702f3f9a185959b4 +size 436349019 diff --git a/full_models/azz/config.json b/full_models/azz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/azz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/azz/vocab.txt b/full_models/azz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1a6fb321503f47ce25858cae69c3010688569d29 --- /dev/null +++ b/full_models/azz/vocab.txt @@ -0,0 +1,33 @@ +| +a +i +n +u +e +t +c +o +h +j +m +s +l +q +y +p +d +z +í +r +x +ó +b +g +ú +á +é +f +v +ñ +k + diff --git a/full_models/bak/D_100000.pth b/full_models/bak/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92b13fab184e9f15e5209c2d2e19acad99d13965 --- /dev/null +++ b/full_models/bak/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b6155e728678f3be20993a62e12da66f4ce0317b0552a87823a261e86fc26b +size 561098185 diff --git a/full_models/bak/G_100000.pth b/full_models/bak/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a1be5fb802349168ed3bd7660e992b2df1491bd --- /dev/null +++ b/full_models/bak/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df6bccc72a5fe2579bf729977fd42405f6a9be0b23e5890827f0443ab63904e5 +size 436556481 diff --git a/full_models/bak/config.json b/full_models/bak/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bak/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bak/vocab.txt b/full_models/bak/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c8d5b03d6d7114ce28a4a471cd5614949df06966 --- /dev/null +++ b/full_models/bak/vocab.txt @@ -0,0 +1,47 @@ +ш +з +м +ц +ж +е +ь +й +я +_ +- +в +ю +һ +ч +ъ +ү +a +ҡ +– +т +э +ф +ы +л +ң +и +г +б +о +ҫ +1 +8 +у +п +х +ғ +д +с + +н +ө +р +ә +к +а +ҙ diff --git a/full_models/bam/D_100000.pth b/full_models/bam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..14c5ad2117d61a92b93c22061291a577d7602292 --- /dev/null +++ b/full_models/bam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808838b0d4bf721d5fc45b8954f7f9e1d876a442df5155a70e172f4a8b0f3957 +size 561078706 diff --git a/full_models/bam/G_100000.pth b/full_models/bam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5811e2aab29582c6866d7d48da46cfaae1871ca --- /dev/null +++ b/full_models/bam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3846ab1251d8a4dafd18c05ef066d5960fd753f201e70a1b7a8a318767dd7024 +size 436373580 diff --git a/full_models/bam/config.json b/full_models/bam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bam/vocab.txt b/full_models/bam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b9477f320c02099b126d5e2258fdaaec0afb2111 --- /dev/null +++ b/full_models/bam/vocab.txt @@ -0,0 +1,36 @@ +| +a +n +i +k +ɛ +e +ɔ +l +u +o +y +m +b +s +w +t +r +d +g +f +j +' +ɲ +c +h +p +z +- +v +ŋ +– +q +1 +8 + diff --git a/full_models/ban/D_100000.pth b/full_models/ban/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..359b2b1138a2f897346262ab1c573015ec04cc3a --- /dev/null +++ b/full_models/ban/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319287a1ab1a731f66ec5b4a6b40dcdd31ac0afa12ee83f95e4d0963d25613fc +size 561078250 diff --git a/full_models/ban/G_100000.pth b/full_models/ban/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7b33d03d387afa8c0003161ed542bc04e87e5d1b --- /dev/null +++ b/full_models/ban/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a394e61ec71bbed91f9af1e4a0d95da58a3b70894089db08e62b9c1aaa407950 +size 436348343 diff --git a/full_models/ban/config.json b/full_models/ban/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ban/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ban/vocab.txt b/full_models/ban/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f90af2db3510a7cf88a06dbfe168d1996684266e --- /dev/null +++ b/full_models/ban/vocab.txt @@ -0,0 +1,25 @@ +a +| +n +i +e +g +s +u +k +t +r +p +d +m +h +l +y +o +w +b +j +c +- +' + diff --git a/full_models/bao/D_100000.pth b/full_models/bao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..98cc6bd6202423492bd0891ae8b346b911914491 --- /dev/null +++ b/full_models/bao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a706144036391b741750e0459a5eef82c1dddb7d219f6ba861474175d8db0cb +size 561078603 diff --git a/full_models/bao/G_100000.pth b/full_models/bao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b4c10c02832a578f2f4c932640d45878d3d218a9 --- /dev/null +++ b/full_models/bao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8252693f911d8d4205feec3aaf06b1847c2ead8925a17d57be22a10188375af +size 436394420 diff --git a/full_models/bao/config.json b/full_models/bao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bao/vocab.txt b/full_models/bao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..00b3bceb9ca76b28919b2492560b3f833f392d7b --- /dev/null +++ b/full_models/bao/vocab.txt @@ -0,0 +1,45 @@ +| +a +i +r +e +c +ʉ +o +j +t +m +u +p +n +ã +b +̃ +w +ĩ +ñ +y +d +g +s +q +õ +é +— +l +í +ũ +ú +á +' +ẽ +f +h +ó +v +z +1 +x +k +́ + diff --git a/full_models/bav/D_100000.pth b/full_models/bav/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa720eafbe156b6fa438a8a26ac5f8c59ba9b3a9 --- /dev/null +++ b/full_models/bav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489f1a7fc4a71264436c0fec305173f2de80f9b537adbb8210810ea045c58fa6 +size 561078887 diff --git a/full_models/bav/G_100000.pth b/full_models/bav/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4584672251af9078b73fae1113541d975d10154d --- /dev/null +++ b/full_models/bav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e419f024e1c4c1bc4210051920fc7502ba9db6f3fa850e11c33d63d39b24e7bd +size 436383825 diff --git a/full_models/bav/config.json b/full_models/bav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bav/vocab.txt b/full_models/bav/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..176efe1949b4d38cf4f12d918e9aabe78a08e67d --- /dev/null +++ b/full_models/bav/vocab.txt @@ -0,0 +1,40 @@ +| +ə +a +ŋ +i +n +ɨ +w +s +u +v +e +k +t +m +y +ɔ +f +' +l +h +b +g +́ +d +o +ù +̀ +z +j +ì +à +r +- +è +p +ò +ú +̰ + diff --git a/full_models/bba/D_100000.pth b/full_models/bba/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..946d294fbf79b5a206d485a823cb797dc8fc89dc --- /dev/null +++ b/full_models/bba/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf024be2d4c5a093372c895b276e9fd4df94e2db85c847f5b8419351be584b73 +size 561078706 diff --git a/full_models/bba/G_100000.pth b/full_models/bba/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53faa3c14994a1619b5fa394fc00a142408d252c --- /dev/null +++ b/full_models/bba/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326ed6394358eb1d3dcde669d8f6fbe503e6d0dad768fda4ac16ad42e6f144dc +size 436371968 diff --git a/full_models/bba/config.json b/full_models/bba/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bba/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bba/vocab.txt b/full_models/bba/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6cde200b41872db9921bb92faffb1b3efbae3bbf --- /dev/null +++ b/full_models/bba/vocab.txt @@ -0,0 +1,35 @@ +| +a +u +n +i +ɔ +s +k +b +m +r +e +ɛ +o +w +y +g +d +t +̃ +p +ã +l +ǹ +ĩ +ù +h +f +̀ +à +è +ì +ũ +ò + diff --git a/full_models/bbb/D_100000.pth b/full_models/bbb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0976cfc991e451b39daff73985df19da883e7241 --- /dev/null +++ b/full_models/bbb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429b10887d36aafca394125a70a78506d85d470d3c99a90546bc70230b6cf3a0 +size 561109991 diff --git a/full_models/bbb/G_100000.pth b/full_models/bbb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7497704d1245486f24044e333f861a4e3497a83b --- /dev/null +++ b/full_models/bbb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b9575836fcd10bcc4214385b206b1f25bfcba39f86c0ad6fd10da479ad2466 +size 436578450 diff --git a/full_models/bbb/config.json b/full_models/bbb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bbb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bbb/vocab.txt b/full_models/bbb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..acb9ba546dced3e0783c6b58cd416c9643df04bf --- /dev/null +++ b/full_models/bbb/vocab.txt @@ -0,0 +1,22 @@ +| +e +a +i +u +o +n +r +j +k +f +m +v +b +g +d +s +t +z +- +l + diff --git a/full_models/bbc/D_100000.pth b/full_models/bbc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed9a1fd0f57d7cb08d108e6a00636e5c13be555e --- /dev/null +++ b/full_models/bbc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e1694920ca36d5e474c66cb994f422d3e85b483f1b68315b991525d046a014a +size 561098185 diff --git a/full_models/bbc/G_100000.pth b/full_models/bbc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..270e516601a5d2bb7b80bbca42cad91b53a9ebbb --- /dev/null +++ b/full_models/bbc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a2e62eef0ddecfa952e5b4325a862131d8342941a8481ed0de030e947d1d3b +size 436515009 diff --git a/full_models/bbc/config.json b/full_models/bbc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bbc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bbc/vocab.txt b/full_models/bbc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6c1e943ad709c5c8e9f5021acfa0392796494faf --- /dev/null +++ b/full_models/bbc/vocab.txt @@ -0,0 +1,29 @@ +e +m +f +k +y +w +a +l +t +i +b +o + +h +v +d +u +g +c +j +z +_ +— +é +- +r +n +p +s diff --git a/full_models/bbo/D_100000.pth b/full_models/bbo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b40c290fa2d572d9e3a76c6f89a2582cb10d803 --- /dev/null +++ b/full_models/bbo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5aa690f9cbd891f8f89850afe556b9b437df6accad7ab20c56f139196b505d +size 561098185 diff --git a/full_models/bbo/G_100000.pth b/full_models/bbo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..06d2fd683f87480895fa291afcb39c16f99a54f3 --- /dev/null +++ b/full_models/bbo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cfcf15be9f43764099654c778f83d82dab357699dc0bee2eaa399607e27577 +size 436528833 diff --git a/full_models/bbo/config.json b/full_models/bbo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bbo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bbo/vocab.txt b/full_models/bbo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f7cea5c2b57c2798dd95fe44cace57614a5de4e3 --- /dev/null +++ b/full_models/bbo/vocab.txt @@ -0,0 +1,35 @@ +ɔ +_ +s +f +g +á +ɩ +ɲ +— +̣ +ʋ +u +n +k +m +h +' +y +e +i +ɛ +w +- +j +t +b +p +o + +a +r +d +l +́ +ŋ diff --git a/full_models/bcc-script_arabic/D_100000.pth b/full_models/bcc-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..72b62f06789ff6cac4e86241fbcd94e6cdc3a32c --- /dev/null +++ b/full_models/bcc-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5021a86ea53f5f474484e9b1cc93be9ad9b8ab5ffed147fed54432c61d35f7a +size 561098185 diff --git a/full_models/bcc-script_arabic/G_100000.pth b/full_models/bcc-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97283ef603a5dabe7504647b945931d73b6e381f --- /dev/null +++ b/full_models/bcc-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8031f446698f0b73cda9b5cd84bc30938678258a38c25a538013ea9160d0cd0f +size 436519617 diff --git a/full_models/bcc-script_arabic/config.json b/full_models/bcc-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bcc-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bcc-script_arabic/vocab.txt b/full_models/bcc-script_arabic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f53dda6abe5958c789d289a9ad2b0ec998a4dd10 --- /dev/null +++ b/full_models/bcc-script_arabic/vocab.txt @@ -0,0 +1,31 @@ +پ +م +ٹ +ی +ت +ێ +ے +چ +ڈ +ا +ن +ش +آ +ب +ۆ +ه +د +ڑ +ک +ز +ل +ژ +و +س +_ + +گ +ج +ر +ئ +- diff --git a/full_models/bcc-script_latin/D_100000.pth b/full_models/bcc-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e0725aea8a1f7d8130f90022d9669a5ee3013db --- /dev/null +++ b/full_models/bcc-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d6af5a302d185e650b210ee1999f5558077d6b96e3c89fc2636163cd7b14fe6 +size 561078380 diff --git a/full_models/bcc-script_latin/G_100000.pth b/full_models/bcc-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5900e9164aa84406c4f4df6fdf5144086298f527 --- /dev/null +++ b/full_models/bcc-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016bf10682ffb4d6a60f044faaa5e9ec171e109b0015fe7b75d1000501b33baa +size 436357441 diff --git a/full_models/bcc-script_latin/config.json b/full_models/bcc-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/bcc-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bcc-script_latin/vocab.txt b/full_models/bcc-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4bc85c22bb9aeb92b5a5820fb51c07fc0f16aec --- /dev/null +++ b/full_models/bcc-script_latin/vocab.txt @@ -0,0 +1,29 @@ +| +a +á +n +h +t +r +s +o +k +i +m +e +d +g +é +y +b +w +p +l +c +ó +z +j +u +' +- + diff --git a/full_models/bcl/D_100000.pth b/full_models/bcl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1550d4845182b87f69de094cf404f4f725e0d8ee --- /dev/null +++ b/full_models/bcl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54774dd27622aec963cdc3ef72833a55fdcf3ad162d36d46359bc448fab404b8 +size 561077950 diff --git a/full_models/bcl/G_100000.pth b/full_models/bcl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e51fb8368d76e9e501bb0ea40dee5208ecfffd4a --- /dev/null +++ b/full_models/bcl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64d4b627d4203119b6320a14f0589cc70a8f75c9be43d63c3df294af259f94c +size 436362047 diff --git a/full_models/bcl/config.json b/full_models/bcl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bcl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bcl/vocab.txt b/full_models/bcl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b97a3d77a0e91b1d4a2954f63e6ad97d86b46910 --- /dev/null +++ b/full_models/bcl/vocab.txt @@ -0,0 +1,31 @@ +a +| +n +i +g +o +s +k +m +d +t +u +l +p +b +r +y +h +e +w +j +- +c +f +— +z +v +' +q +x + diff --git a/full_models/bcw/D_100000.pth b/full_models/bcw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..115b733a8a4e7bb9e9aed97cf79894ec29be586d --- /dev/null +++ b/full_models/bcw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2415b0647064c8d28a1b1e4f94774a01334716c611ba0bd1af2710af407450 +size 561076165 diff --git a/full_models/bcw/G_100000.pth b/full_models/bcw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5a2624e3a9270edb66f14a9a7213d0371acf9c5b --- /dev/null +++ b/full_models/bcw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41cd7562440aece58dde3d8fc1409f29a8f7931132399f60a50213fca7b62350 +size 436339646 diff --git a/full_models/bcw/config.json b/full_models/bcw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bcw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bcw/vocab.txt b/full_models/bcw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2f768f581d3f2586892e881623bfb5700b0d2f43 --- /dev/null +++ b/full_models/bcw/vocab.txt @@ -0,0 +1,29 @@ +| +a +ə +i +h +n +m +s +w +k +t +y +g +z +l +b +d +v +r +e +' +ŋ +p +c +ɓ +f +ɗ +j + diff --git a/full_models/bdg/D_100000.pth b/full_models/bdg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7fceeec75f03fec81f58a4a3311ad0d0655a0915 --- /dev/null +++ b/full_models/bdg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce18ff916eabda4c9cd4a0b41b7cb58924a5be70dbeec3ed7844e30664ed34af +size 561098185 diff --git a/full_models/bdg/G_100000.pth b/full_models/bdg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cf6c3fe2d600715f72845b553500178784ec5a2c --- /dev/null +++ b/full_models/bdg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:946ece8fd7e344455aac4d91c6e3684aa6081a714722c08d3f15aa3155b75028 +size 436503489 diff --git a/full_models/bdg/config.json b/full_models/bdg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bdg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bdg/vocab.txt b/full_models/bdg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6ad7ad0e1bc2ae49d18df17ac27322e611ef32eb --- /dev/null +++ b/full_models/bdg/vocab.txt @@ -0,0 +1,24 @@ +a +m +i +u +e +y +k +' +w +_ +p +n +l +h +g +r +d +s +t + +b +j +- +o diff --git a/full_models/bdh/D_100000.pth b/full_models/bdh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..138134e4c6b6c988ad150bee78ce920acb462ad1 --- /dev/null +++ b/full_models/bdh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56fa4e76591ad978bcefd81767cf0b6ac5665c8ced73699c85bd93baa88a2ba +size 561098185 diff --git a/full_models/bdh/G_100000.pth b/full_models/bdh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..306b916e33dc6e331663feb9bea37ae265b9b30a --- /dev/null +++ b/full_models/bdh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f18f7c28b52bfd29c1faeeeb8cf557a98bc9f239ba5a77c8bc7dab4593a536f +size 436538049 diff --git a/full_models/bdh/config.json b/full_models/bdh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bdh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bdh/vocab.txt b/full_models/bdh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24f716a9580c8d84042171ed4dfbf5166751fac2 --- /dev/null +++ b/full_models/bdh/vocab.txt @@ -0,0 +1,39 @@ +ṿ +ú +b +a +d +_ +ṛ +w +ị +c +r + +é +ṇ +ɨ +f +s +v +' +á +o +m +ụ +k +h +í +́ +ó +l +ꞌ +n +i +y +p +t +u +g +e +z diff --git a/full_models/bdq/D_100000.pth b/full_models/bdq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b66a142fee3afcba278036c71e61bc24b3f8e632 --- /dev/null +++ b/full_models/bdq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b951740480dcb5f76071f6336860ad600e48cb68534de280c87554e3c4947e25 +size 561078605 diff --git a/full_models/bdq/G_100000.pth b/full_models/bdq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ffb30e5e3993229b6ebb68136fcc59a7569972e0 --- /dev/null +++ b/full_models/bdq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65566612778ba881df572289c7006f81dbed6b644a920de2087abccfd7424616 +size 436376001 diff --git a/full_models/bdq/config.json b/full_models/bdq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bdq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bdq/vocab.txt b/full_models/bdq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..552f5be666785a4d8f5ce40cf07bf12493ae9766 --- /dev/null +++ b/full_models/bdq/vocab.txt @@ -0,0 +1,37 @@ +| +ơ +n +h +i +k +a +g +t +m +o +l +ă +b +e +u +s +p +r +̆ +ư +d +' +ô +đ +ĕ +y +- +ê +j +c +ŏ +w +â +ŭ +ĭ + diff --git a/full_models/bdu/D_100000.pth b/full_models/bdu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1848697b9a2cc715c28d7222d231acae7a8b54fa --- /dev/null +++ b/full_models/bdu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf483e42e3d9ab4e202423f70ee973db95f90f7b833147f3ffba050fde356b1 +size 561110625 diff --git a/full_models/bdu/G_100000.pth b/full_models/bdu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ee9def48c27d98b5b82a0865e317d1ee24da7abb --- /dev/null +++ b/full_models/bdu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6428db4b16d96f24aa6c015f878868a3502e38b8b76def7f0e5d5339134416e6 +size 436636241 diff --git a/full_models/bdu/config.json b/full_models/bdu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bdu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bdu/vocab.txt b/full_models/bdu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..26b13e27690f23343ac01f1f52a05b7ebf3d174f --- /dev/null +++ b/full_models/bdu/vocab.txt @@ -0,0 +1,45 @@ +| +a +o +n +b +i +ɗ +ɛ +e +m +k +s +ɔ +t +u +y +g +j +w +' +f +d +- +ŋ +r +p +h +c +l +0 +1 +7 +v +2 +4 +z +6 +8 +9 +5 +– +3 +ó +x + diff --git a/full_models/bdv/D_100000.pth b/full_models/bdv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..532294082b16d0ac11600fe2a0d8f4f2934dcfd1 --- /dev/null +++ b/full_models/bdv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe7eb45c0da2c5dc7951793bea3a7cd1fd9227ac7ff7aaea539d96decaafd08 +size 561098185 diff --git a/full_models/bdv/G_100000.pth b/full_models/bdv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ec94a119a3943f73f1eeb58227329e6766f10ceb --- /dev/null +++ b/full_models/bdv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121581374164e8b0dad4cfdc1c1a30aa18dc5af2883f484ae49081f82dd248b4 +size 436538049 diff --git a/full_models/bdv/config.json b/full_models/bdv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bdv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bdv/vocab.txt b/full_models/bdv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5e42288049a17155fbd1c157e09d6b1479e68f3f --- /dev/null +++ b/full_models/bdv/vocab.txt @@ -0,0 +1,39 @@ +' +ଞ +ତ +ବ +ସ +ୱ +‍ +ଂ +ଚ +େ +ଜ +ଟ +ନ +ଡ +ହ +ଦ +ଏ +ଙ +୍ +ଗ +କ +ଅ +ଉ +ର +ଇ +ା +ଃ +ଆ +ୁ +ଣ +ଳ +ମ +_ +ପ +ି +ଁ + +ୟ +ଲ diff --git a/full_models/beh/D_100000.pth b/full_models/beh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f961cfa59733c13e315592b7c08539b1d66f0037 --- /dev/null +++ b/full_models/beh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:605bdffe5046bde32eeb5594ae5ed1c4e11a0997f2e9b13d9735c744dce13b30 +size 561098185 diff --git a/full_models/beh/G_100000.pth b/full_models/beh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..943dea65a57e4fce9e0b274f25f714da64c2c5a7 --- /dev/null +++ b/full_models/beh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28655338c0367274fa007aac27111bc7568253176e776fab388b7146d274f807 +size 436519617 diff --git a/full_models/beh/config.json b/full_models/beh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/beh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/beh/vocab.txt b/full_models/beh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2a6b9e78179ae8e017d16ddc88915441331d358b --- /dev/null +++ b/full_models/beh/vocab.txt @@ -0,0 +1,31 @@ +f +á +s +é +u +m +ó +k +- +l +i +r +w +d +h + +_ +y +g +t +́ +o +e +c +a +í +p +ǝ +ú +n +b diff --git a/full_models/bem/D_100000.pth b/full_models/bem/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f6cd1e5b61e583b638d80a03c1dcb3ee04383a96 --- /dev/null +++ b/full_models/bem/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cbd0d38776d41ad136c9a09197f97d8f4bbb31c03a361ddcac92e3053db1839 +size 561079219 diff --git a/full_models/bem/G_100000.pth b/full_models/bem/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..763899ce41c1862aa87a05b5b017015de5645fd1 --- /dev/null +++ b/full_models/bem/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330294cf20416f177d328b93480e77ac1173755dc57f0c94b160786656c52726 +size 436371430 diff --git a/full_models/bem/config.json b/full_models/bem/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bem/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bem/vocab.txt b/full_models/bem/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3d8a1c1385037460ca84f6d17556813210955719 --- /dev/null +++ b/full_models/bem/vocab.txt @@ -0,0 +1,33 @@ +| +a +i +u +e +l +n +k +m +b +o +w +s +t +y +p +h +f +c +g +d +r +' +ū +ā +ē +ī +ō +ŋ +j +- +– + diff --git a/full_models/ben/D_100000.pth b/full_models/ben/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..44fae202c089bfb4f3f04a16c62d0b4f23efa2db --- /dev/null +++ b/full_models/ben/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f38db13f66121e42eebbd344c97ab87142ed617380664231b300d776a03f94 +size 561110095 diff --git a/full_models/ben/G_100000.pth b/full_models/ben/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cb1105ae544104454a9adfce36ed3fd23fabc6f7 --- /dev/null +++ b/full_models/ben/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c140f81ea84ef1c10d6000895b5002657466467e62628d31e0d96187e8a5643 +size 436700030 diff --git a/full_models/ben/config.json b/full_models/ben/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ben/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ben/vocab.txt b/full_models/ben/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..a60ec003506c95d6bc81b05882fb1a12bc4d49cb --- /dev/null +++ b/full_models/ben/vocab.txt @@ -0,0 +1,74 @@ +6 +এ +ৃ +5 +ু +ঞ +প +ঘ +8 +ক +ল +9 +ি +ঃ +থ +1 +ভ +দ +ী +_ +স +ড +ঢ +ছ +ই +ং +ঁ +আ +ব +হ +' +2 +— +ঈ +ঊ +ঐ +্ +ে +য +খ +ূ +ম +ত +ঝ +ৌ +4 +ষ +জ +শ +ঔ +অ +ণ +ৎ +7 +ও +ট +ৈ + +ধ +া +ন +0 +3 +ঋ +ফ +চ +উ +- +় +র +ঙ +গ +ো +ঠ diff --git a/full_models/bep/D_100000.pth b/full_models/bep/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3914f16eae21920a3201f1f79279fcc3c7873d57 --- /dev/null +++ b/full_models/bep/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45ba108092081bf38471968d5aa1a4a96b56e03019043e1051c764afe990175a +size 561098185 diff --git a/full_models/bep/G_100000.pth b/full_models/bep/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3cec94a22170aca14909237e005c86da0240767 --- /dev/null +++ b/full_models/bep/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edbbdff09341217a98a479b95b51db3d96beb0f26af6053028b151b87da5a383 +size 436510401 diff --git a/full_models/bep/config.json b/full_models/bep/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bep/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bep/vocab.txt b/full_models/bep/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5193c5951f77a0bfce7f703f5116cdbb7dbb4902 --- /dev/null +++ b/full_models/bep/vocab.txt @@ -0,0 +1,27 @@ +á +o +j +' + +i +u +d +n +_ +k +ꞌ +g +b +r +- +a +t +w +p +l +c +s +h +m +e +ó diff --git a/full_models/bex/D_100000.pth b/full_models/bex/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..df13b93101ec8a96830bef0cbabf361cb1861be5 --- /dev/null +++ b/full_models/bex/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a0a2f68d17e1c4b4be81a94d94d882273160bd0e7b2b9d85ac6f293eb54320 +size 561078766 diff --git a/full_models/bex/G_100000.pth b/full_models/bex/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e753b8b4533fec60a40c52aadac8f78257e83494 --- /dev/null +++ b/full_models/bex/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db3c12181f72160d30b96799b93657219f98aaa28a39701b26f73f6495838a8b +size 436369603 diff --git a/full_models/bex/config.json b/full_models/bex/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bex/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bex/vocab.txt b/full_models/bex/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7367f86d31046b233fea20a884a73e209909679f --- /dev/null +++ b/full_models/bex/vocab.txt @@ -0,0 +1,33 @@ +| +a +i +k +ɔ +e +n +d +m +b +o +ï +t +' +l +y +g +ö +r +ë +u +z +ŋ +p +s +j +w +c +h +3 +8 +2 + diff --git a/full_models/bfa/D_100000.pth b/full_models/bfa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f381971b2ff2679519d6e938803f74f483223e2 --- /dev/null +++ b/full_models/bfa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b914bdf51ae4c535814a8d2eb3603c5840a6ee22408df3aa38095004756b9691 +size 561098185 diff --git a/full_models/bfa/G_100000.pth b/full_models/bfa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81f9eb799682db5a8efc5285a8e6b773c6f40467 --- /dev/null +++ b/full_models/bfa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0409ad930d0ad0b826d6848b499afde26415c4e1f5c23f8fb7c3df46b718a5ea +size 436512705 diff --git a/full_models/bfa/config.json b/full_models/bfa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bfa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bfa/vocab.txt b/full_models/bfa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2e83f52ee806876d9c77d51fa30de75eec47a9d8 --- /dev/null +++ b/full_models/bfa/vocab.txt @@ -0,0 +1,28 @@ +' +h +r +o +y +a +— +i +g +m +_ +l +s + +n +u +k +j +ŋ +ö +- +d +p +e +w +t +é +b diff --git a/full_models/bfo/D_100000.pth b/full_models/bfo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..73549fe25ebe293634627ba8abece89517f38efd --- /dev/null +++ b/full_models/bfo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bcf3c6b88fb854bb3fe014a3a5cde3db1c4a5413200ac598ca1082b2c9a205 +size 561098185 diff --git a/full_models/bfo/G_100000.pth b/full_models/bfo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3ac8ea5168976134dce8f68609f6b72154d99d1 --- /dev/null +++ b/full_models/bfo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aec2afb64295c036083c7c754cb06249356bc8ba68101c8bad9080dc5e737ac +size 436561089 diff --git a/full_models/bfo/config.json b/full_models/bfo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bfo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bfo/vocab.txt b/full_models/bfo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8666891ac42fce54c07f6f0624698a77a0634130 --- /dev/null +++ b/full_models/bfo/vocab.txt @@ -0,0 +1,49 @@ +g +j +ẽ +s +ʻ +ꞌ +u +ʋ +w +õ +k +v +d +m +́ +ú +r +1 +o +p +t +n +f +— +ũ +é +c +_ +ɛ +- + +i +ʼ +ŋ +e +h +á +y +ĩ +̃ +ɩ +ↄ +ƴ +ã +a +b +l +ɓ +ı diff --git a/full_models/bfy/D_100000.pth b/full_models/bfy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..03f48ea0ac57cafc0fc96fbb53cb2f3789e356fe --- /dev/null +++ b/full_models/bfy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a518f8e8bd8594db0f3c2716b7f687812d86db15f359b1d24b62c0519a8879 +size 561098185 diff --git a/full_models/bfy/G_100000.pth b/full_models/bfy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf6cbc35596d09f29b34ea88ae10572c3b627a2c --- /dev/null +++ b/full_models/bfy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a2cb7fd6409b2a926f225d879ebc579d3303312f91ac385a8ec1db72f8f160 +size 436572609 diff --git a/full_models/bfy/config.json b/full_models/bfy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bfy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bfy/vocab.txt b/full_models/bfy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50736a716227c257cde28624a7e744c3ac1593f5 --- /dev/null +++ b/full_models/bfy/vocab.txt @@ -0,0 +1,54 @@ +़ +ौ +छ +द +व +स +ह +1 +ू +ि +ट +' +े +य +_ +क +अ +आ +उ +ै +ध +ल + +ब +प +फ +ढ +ड +ई +च +झ +म +ओ +ु +घ +भ +ा +ं +ग +ख +ी +- +ऊ +इ +र +थ +ो +त +न +ँ +ज +् +ठ +ए diff --git a/full_models/bfz/D_100000.pth b/full_models/bfz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a194026748c1ead140f8b869e5082186da311083 --- /dev/null +++ b/full_models/bfz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4d60abff7791722529daa67f4b795eb7fcb750665aff28e48df1bcf72571cb +size 561098185 diff --git a/full_models/bfz/G_100000.pth b/full_models/bfz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6f68ad0c731ce92b3e487270e502f21ed5879321 --- /dev/null +++ b/full_models/bfz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b891bfecc5e478a1516dfbce3fb54cec64e0179b71ccb5f733576fa54a0ed03 +size 436593345 diff --git a/full_models/bfz/config.json b/full_models/bfz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bfz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bfz/vocab.txt b/full_models/bfz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0038e1f4bfd969efcd35bfbd3161f6b87058aac9 --- /dev/null +++ b/full_models/bfz/vocab.txt @@ -0,0 +1,63 @@ +अ +- +भ +ु +ठ +त +र +़ +आ +8 +ी +प +् +‍ +ग +ू +ढ +फ +ट +ै +च +य +छ +ँ +ं +ए +घ +द +स +म +इ +_ +औ +क +ई +उ +ऊ +ध +थ + +ञ +ा +झ +ल +ब +ड +ो +ह +4 +ण +श +ष +ौ +ः +ि +े +न +ख +व +ज +ृ +ऐ +ओ diff --git a/full_models/bgc/D_100000.pth b/full_models/bgc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2f87d7f3d2c7f7e9538dd37622ba4ffbb5afe276 --- /dev/null +++ b/full_models/bgc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7092bf057f1cc9c21cabdbd11ae7ea2436b2c08a8f5a912c4d4fe617bf060497 +size 561098185 diff --git a/full_models/bgc/G_100000.pth b/full_models/bgc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..36b2861078d1f76916579419fba0f3e3e55ae14b --- /dev/null +++ b/full_models/bgc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:717630c1c2d83821f0e85211d2f13f982719734a43049f82999ac5a13de630b4 +size 436593345 diff --git a/full_models/bgc/config.json b/full_models/bgc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bgc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bgc/vocab.txt b/full_models/bgc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b9f1dc3b3578975bd6518b50f917008fad4ab018 --- /dev/null +++ b/full_models/bgc/vocab.txt @@ -0,0 +1,63 @@ +े +ै +र +औ +श +ढ +ृ +ख +ठ +ह +ि +फ +न +प +व +झ +ू +च +ग +ँ +थ +ए +ा +द +ओ +उ +् +ऐ +_ +घ +अ +आ +- +य +' +ं +ब +ु +ज + +ो +ल +इ +ण +ष +म +‍ +ऊ +ी +भ +स +़ +ध +ौ +ञ +ऋ +ट +ड +छ +क +ई +ळ +त diff --git a/full_models/bgq/D_100000.pth b/full_models/bgq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ef78d4e488479c52cc8189d3ae8f86f83efa3956 --- /dev/null +++ b/full_models/bgq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197ca40393a1529fd03375db83f8e993c51c055ad6b5aaf20c40e2ad84b97def +size 561098185 diff --git a/full_models/bgq/G_100000.pth b/full_models/bgq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..473299e487497a19cdda2a9ca1b58c593db512c4 --- /dev/null +++ b/full_models/bgq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f576e31b7e6476abf16d2586f73fa992e24b51585bc2da9f4942919a2db65f +size 436591041 diff --git a/full_models/bgq/config.json b/full_models/bgq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bgq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bgq/vocab.txt b/full_models/bgq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4a883336f9c0a60537fa2abd3e8f3aec92805131 --- /dev/null +++ b/full_models/bgq/vocab.txt @@ -0,0 +1,62 @@ +उ +ए +झ +ू +ठ +ी +ण +ड +म +न +य +अ +इ +6 +् +2 +ह +ं +ज +आ +ढ +0 +प +भ +ओ +व +ऊ +_ +क +ख +' +ळ +1 +ो +च +ौ +स + +त +ऐ +ब +5 +ई +ध +ल +छ +3 +ै +़ +ा +ु +- +ट +फ +4 +घ +ग +थ +द +े +र +ि diff --git a/full_models/bgr/D_100000.pth b/full_models/bgr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e1684414adb7c520df8bdd32d71b86b753168980 --- /dev/null +++ b/full_models/bgr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a216b1d30493bb6a952026d11ab3ac65873ee897516ab771b171ee9db3645002 +size 561078876 diff --git a/full_models/bgr/G_100000.pth b/full_models/bgr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe8c7108aabbe5fd784f4b24253a01e5bc79b101 --- /dev/null +++ b/full_models/bgr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f522502ca198aaa6bf3cc10ca1ec14bba78d5cb67d9e9ff10ea3f0842982ef +size 436377168 diff --git a/full_models/bgr/config.json b/full_models/bgr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bgr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bgr/vocab.txt b/full_models/bgr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e8d0b9b91f0291a3455658feb7b2c4b85801242d --- /dev/null +++ b/full_models/bgr/vocab.txt @@ -0,0 +1,36 @@ +| +a +h +n +i +u +l +t +k +e +m +g +s +w +â +c +r +p +d +o +z +ê +b +f +v +û +ṭ +j +î +' +- +à +1 +y +q + diff --git a/full_models/bgt/D_100000.pth b/full_models/bgt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dad8170402a04cc56efa8429ca3dcbad3a5d5408 --- /dev/null +++ b/full_models/bgt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a77460c03b0c9d2190d36014a7ff1b955d5a8b6972b6e4263573507b919a865e +size 561098185 diff --git a/full_models/bgt/G_100000.pth b/full_models/bgt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d529f8c4a2fb42981e2bb68cb47b644036a41928 --- /dev/null +++ b/full_models/bgt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0006fcbaa1e3c35ee052f2fb4f7436f95285899a77be130040be860f333b54 +size 436505793 diff --git a/full_models/bgt/config.json b/full_models/bgt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bgt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bgt/vocab.txt b/full_models/bgt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5fc74e5afe94aa7d695e352e53928d3c208dedf9 --- /dev/null +++ b/full_models/bgt/vocab.txt @@ -0,0 +1,25 @@ + +' +o +a +p +m +e +w +u +i +j +c +k +n +r +g +s +h +l +t +b +_ +v +f +d diff --git a/full_models/bgw/D_100000.pth b/full_models/bgw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..95d2ba3122b24c6d7effb188562c342bdad24e42 --- /dev/null +++ b/full_models/bgw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76495202fee8430878dd27be62c5d33a023562afc0b58ffddcdcfd7aa18b1f3 +size 561098185 diff --git a/full_models/bgw/G_100000.pth b/full_models/bgw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..31f91d39af1c3b54c110fd84aa12f87f24c8a18c --- /dev/null +++ b/full_models/bgw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143141d93d03ff4ec0dc73985f7e215fd2fe0d49d9d3d7565a91d313cabd9b93 +size 436544961 diff --git a/full_models/bgw/config.json b/full_models/bgw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bgw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bgw/vocab.txt b/full_models/bgw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2810d19cecbc5ebba9174775a2b2df6f25265ce7 --- /dev/null +++ b/full_models/bgw/vocab.txt @@ -0,0 +1,42 @@ +ल +ख +इ +ा +र +स +ह +ि +ई +ी +ब +त +य +ं + +े +म +च +ऊ +ए +ू +ड +ग +6 +ु +उ +भ +क +ओ +‍ +' +ट +़ +अ +द +व +न +ो +आ +ज +प +_ diff --git a/full_models/bha/D_100000.pth b/full_models/bha/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d368839e19dff5bde9ccb3e1b256a46e7e6bad69 --- /dev/null +++ b/full_models/bha/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d965ad4b3d5fc28d82c6e316764ded5ab6145df80be85ee6c3fd9f6873ae84a +size 561098185 diff --git a/full_models/bha/G_100000.pth b/full_models/bha/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ebb4118db5f0c502cfcc80c44438981394bd6673 --- /dev/null +++ b/full_models/bha/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7959be573ec9ad1aabd41cb10320071931c8d1fb88d81b5cec8115d779193154 +size 436556481 diff --git a/full_models/bha/config.json b/full_models/bha/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bha/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bha/vocab.txt b/full_models/bha/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1b71e778811f0f5dfae765c09bae4f1d4d249c91 --- /dev/null +++ b/full_models/bha/vocab.txt @@ -0,0 +1,47 @@ +फ +ठ +म +ु +न +इ +स +त +ल +ं +ग +ट +ए +् +' +घ +थ +_ +ख +व +ढ +ो +ड +य +र +छ +अ +द +भ +झ +ू +च +े +ई +प +ह +ज +आ +़ +क +- +ा +ऊ + +ी +ध +ब diff --git a/full_models/bht/D_100000.pth b/full_models/bht/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..36be4acfd896038a18bc9aed0eec3a9dc5e70b12 --- /dev/null +++ b/full_models/bht/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3de1aa490b9d53a5f7eed86fe9580722a2eddc688b92e7c614d58a21d7c727 +size 561079011 diff --git a/full_models/bht/G_100000.pth b/full_models/bht/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e053fc226dc2c6d1fde981a9491ebc24829f033 --- /dev/null +++ b/full_models/bht/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2741a8f24ef1338316bc24dee4013fccbf76a4d3cbd997de423245f62f75f13a +size 436449647 diff --git a/full_models/bht/config.json b/full_models/bht/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bht/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bht/vocab.txt b/full_models/bht/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a75cf5fd3ee6ce12fab4335850ab8c39c6222287 --- /dev/null +++ b/full_models/bht/vocab.txt @@ -0,0 +1,67 @@ +| +ा +े +र +क +ी +द +स +न +ं +ि +ो +य +ल +त +ज +् +ह +म +प +ु +ब +ण +ै +च +श +ग +ई +उ +ड +़ +अ +ू +व +भ +इ +ख +थ +ऐ +आ +फ +छ +ध +झ +ट +ठ +ओ +घ +ौ +ष +- +ए +ढ +ँ +ऊ +ञ +ृ +औ +‍ +ॉ +0 +' +4 +3 +5 +2 + diff --git a/full_models/bhz/D_100000.pth b/full_models/bhz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c22849856229644b6749f7beedbc522ccb09b212 --- /dev/null +++ b/full_models/bhz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7276ab43c3440407344397963716f468bf9d8649a405c7117e7920a08b30793 +size 561098185 diff --git a/full_models/bhz/G_100000.pth b/full_models/bhz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2894c1b6c3c01aaf02d3a86a23a58f63448235b0 --- /dev/null +++ b/full_models/bhz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3311451acb96a73a6e65652dfe25a1f4e6599be949241541dfb09b6d29f850b5 +size 436508097 diff --git a/full_models/bhz/config.json b/full_models/bhz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bhz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bhz/vocab.txt b/full_models/bhz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..72a7b64e177e2c4c8cd3a764abe10baa1518f342 --- /dev/null +++ b/full_models/bhz/vocab.txt @@ -0,0 +1,26 @@ +e +b +t +— +h +ꞌ +l +n +r +_ +k + +d +g +w +u +p +' +o +- +s +a +m +á +ó +i diff --git a/full_models/bib/D_100000.pth b/full_models/bib/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d03147f93aeb4d90610dc1aab9b0888d42ec1340 --- /dev/null +++ b/full_models/bib/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0040522cfd76d76e04701caee65209b7842c9b225fab3640becff1af0ade8a +size 561078622 diff --git a/full_models/bib/G_100000.pth b/full_models/bib/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2370e3ef9592b67f495b592b13b582cd21052115 --- /dev/null +++ b/full_models/bib/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7d56e0b0e790f9e10d121252e2b3c51b51c167544b1f65a8bfe1fba41b47ed +size 436369846 diff --git a/full_models/bib/config.json b/full_models/bib/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bib/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bib/vocab.txt b/full_models/bib/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4180aaa7512b5585eebd4aec84ab77c3f61921fc --- /dev/null +++ b/full_models/bib/vocab.txt @@ -0,0 +1,34 @@ +| +a +ɔ +ɩ +n +m +b +ʋ +k +r +y +ɛ +s +o +w +i +' +ŋ +d +t +e +h +z +g +l +u +ə +c +p +j +f +v +- + diff --git a/full_models/bim/D_100000.pth b/full_models/bim/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..474c652e4dfd27d147e1df76202216c1cb97fb65 --- /dev/null +++ b/full_models/bim/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a5c1540ca23c89354c81dbd362bd88aa92648bf0741a8b28455ef12b450ffb +size 561078728 diff --git a/full_models/bim/G_100000.pth b/full_models/bim/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..425fddc7496698ea547c6d0d4c61de50818eabf7 --- /dev/null +++ b/full_models/bim/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f888738d429024b8c20aecf9ebe0a3f5e43b3135358c7173dfc37f7c38f101 +size 436365499 diff --git a/full_models/bim/config.json b/full_models/bim/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bim/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bim/vocab.txt b/full_models/bim/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a3939e652c929929b04139314a0ebe4aeca8603b --- /dev/null +++ b/full_models/bim/vocab.txt @@ -0,0 +1,31 @@ +| +a +n +i +k +e +b +t +u +o +m +ɔ +r +s +y +ŋ +p +l +d +j +w +g +f +h +- +c +' +ƒ +q +ê + diff --git a/full_models/bis/D_100000.pth b/full_models/bis/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53df4a8896d27553e19a01b23654a587130df4ce --- /dev/null +++ b/full_models/bis/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21ec42a5f7fc11f80b0d47704f2c30c5228b9dc0fff2a2798ff373059a4f487 +size 561078592 diff --git a/full_models/bis/G_100000.pth b/full_models/bis/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f1d92cd6b7fb9bf069608e9b23e4e03862782b7 --- /dev/null +++ b/full_models/bis/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6515d4f8292a93dd48873e4edb99ccef0e31281553715e7f01e9e95fbc137785 +size 436352924 diff --git a/full_models/bis/config.json b/full_models/bis/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bis/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bis/vocab.txt b/full_models/bis/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f2eaf7e34684e03e949cbb253d86620fd96c4077 --- /dev/null +++ b/full_models/bis/vocab.txt @@ -0,0 +1,27 @@ +| +a +o +e +l +m +n +i +g +t +s +b +u +f +k +y +w +p +r +h +d +v +j +- +' +6 + diff --git a/full_models/biv/D_100000.pth b/full_models/biv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d8c1bc9d80724995587db6c21d097bb3bc27038 --- /dev/null +++ b/full_models/biv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14f83c2005fd6c6d9d7ac2f0879d7319e3d6f29679c5110b8eee785476902473 +size 561078861 diff --git a/full_models/biv/G_100000.pth b/full_models/biv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d922cb107ab2ff549ba55983fcd18644a815c88 --- /dev/null +++ b/full_models/biv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5e47864d218d52d8afaea2981156ab81def2ec2d448ab499bb75b4032541e4 +size 436380757 diff --git a/full_models/biv/config.json b/full_models/biv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/biv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/biv/vocab.txt b/full_models/biv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..be48e48fde4fc50664e3cf867bae368dc01fd127 --- /dev/null +++ b/full_models/biv/vocab.txt @@ -0,0 +1,38 @@ +| +a +n +ɩ +ɛ +ɔ +b +r +ʋ +y +l +̃ +s +k +t +e +m +w +i +p +o +u +ã +' +j +d +f +h +c +ŋ +g +ũ +v +õ +ẽ +ĩ +- + diff --git a/full_models/bjr/D_100000.pth b/full_models/bjr/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6c4439ad67cda35d0bca6c661d8966afd0b0a0f --- /dev/null +++ b/full_models/bjr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2054903eff26280e4aa72dd283a3de9c42de15165238dea635852c6f8b047a85 +size 561076199 diff --git a/full_models/bjr/G_100000.pth b/full_models/bjr/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..61b74f6fda2b184a5eb6afdf36042e646df1b555 --- /dev/null +++ b/full_models/bjr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8586e9bf58655f3b0b88efd9c7017ce1e54d0fa1b16feadc49d5e9edd74b61 +size 436362804 diff --git a/full_models/bjr/config.json b/full_models/bjr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bjr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bjr/vocab.txt b/full_models/bjr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..74aa451b89c328653101d17a1745ff580a8910ad --- /dev/null +++ b/full_models/bjr/vocab.txt @@ -0,0 +1,39 @@ +a +| +i +n +q +m +o +r +u +e +f +s +k +d +t +í +á +y +p +b +é +ú +ó +h +g +- +0 +̱ +2 +w +1 +4 +5 +' +6 +9 +7 +ṉ + diff --git a/full_models/bjv/D_100000.pth b/full_models/bjv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68ba0da486c898f41d38ec61559e77637b011f35 --- /dev/null +++ b/full_models/bjv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6558b7c11c80301323e259f350080da7bb824f65301fc76d4ccef6e993ff5a98 +size 561078766 diff --git a/full_models/bjv/G_100000.pth b/full_models/bjv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97b93c7ccf9a93a51145e931db719199f8188b1e --- /dev/null +++ b/full_models/bjv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc8e2bb18deb0cff6e659a764080380982fbd51d9be39690364bbe3453117c2 +size 436363478 diff --git a/full_models/bjv/config.json b/full_models/bjv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bjv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bjv/vocab.txt b/full_models/bjv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7e30025f043584c3906f4ba7d1271126570b6981 --- /dev/null +++ b/full_models/bjv/vocab.txt @@ -0,0 +1,31 @@ +| +ɨ +a +n +ə +k +e +t +d +j +l +m +o +g +i +r +ɔ +s +- +u +w +b +y +ɓ +ḛ +̰ +p +é +ḭ +h + diff --git a/full_models/bjw/D_100000.pth b/full_models/bjw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8cb1d248d589988c76c8217b53c4e6bd42d1adc0 --- /dev/null +++ b/full_models/bjw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15c3ea4c0c25c62298f2aa1df60557752ad6f7fc34f39bbf6a049c73c9d5188 +size 561098185 diff --git a/full_models/bjw/G_100000.pth b/full_models/bjw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02a93dd065af670e704b9ca27f6158974680c2d6 --- /dev/null +++ b/full_models/bjw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c56aa4075726653c1408748e81508c00e3d55f286ee2222e85cc440eb3fff9 +size 436528833 diff --git a/full_models/bjw/config.json b/full_models/bjw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bjw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bjw/vocab.txt b/full_models/bjw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77b1330814faf54f5777d91f3372d70c3c1e7efd --- /dev/null +++ b/full_models/bjw/vocab.txt @@ -0,0 +1,35 @@ +w +ö +c +ü +d +ä +ë +f +e +m +l +u +ɔ +o +ɩ +s +g +t +b +y +r +‐ +ŋ +ɛ +' +i +ʋ +p +a +_ +n +j +k +v + diff --git a/full_models/bjz/D_100000.pth b/full_models/bjz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6becdf5547735a118b4a52e3690691b2c20b4c01 --- /dev/null +++ b/full_models/bjz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb66658a699c99a17f67d8e7d77a60e57b0ae14e8d0354083849a191d1171c4 +size 561098185 diff --git a/full_models/bjz/G_100000.pth b/full_models/bjz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..18a00bc7674ffb3cde604eb7fc3c646ec7df29f0 --- /dev/null +++ b/full_models/bjz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41952fa84e2239abf88a8e2d6e70b941e64b5803c5f14638f56df3a4871c1238 +size 436556481 diff --git a/full_models/bjz/config.json b/full_models/bjz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bjz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bjz/vocab.txt b/full_models/bjz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ebfe35da0a792a7384b9f513ea2629e16f0449a4 --- /dev/null +++ b/full_models/bjz/vocab.txt @@ -0,0 +1,47 @@ +9 +o +ú +ã +k + +ũ +j +h +- +_ +b +ó +1 +i +0 +y +u +é +g +' +v +e +t +í +f +c +2 +n +l +s +4 +5 +r +ĩ +m +3 +q +d +7 +w +8 +á +6 +a +p +ẽ diff --git a/full_models/bkd/D_100000.pth b/full_models/bkd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a816c85c7c31ce5871355de9fcc8bf9b8a431222 --- /dev/null +++ b/full_models/bkd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71649b54eb1b7af5bff2cfe421d239cd758bf0b59f39d66d0ab53919d9505563 +size 561098185 diff --git a/full_models/bkd/G_100000.pth b/full_models/bkd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf53dc771c77d763a1c9a0a8debda5e9693f4cc0 --- /dev/null +++ b/full_models/bkd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc489212a72dda61ba459e3e6ae86aecf411e51192cb2dd763119fffa25aeae +size 436544961 diff --git a/full_models/bkd/config.json b/full_models/bkd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bkd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bkd/vocab.txt b/full_models/bkd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..65aa3e320ff5c737170a54700233b989f3bd78a2 --- /dev/null +++ b/full_models/bkd/vocab.txt @@ -0,0 +1,42 @@ +w +- +c +3 +k +l +v + +p +7 +4 +r +' +x +0 +2 +5 +z +t +à +m +ù +j +n +a +_ +u +s +y +b +9 +o +1 +g +h +e +d +ì +i +f +6 +è diff --git a/full_models/bkv/D_100000.pth b/full_models/bkv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..46dde26ad2aab198fbd430d37e11458095212025 --- /dev/null +++ b/full_models/bkv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d802626927075cd58f9e9a26729dcf072346037be4ab44aa0a417c6b924a0097 +size 561078492 diff --git a/full_models/bkv/G_100000.pth b/full_models/bkv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d1fc0cd11ead2b9f7a79e31508f68f26b85ec924 --- /dev/null +++ b/full_models/bkv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035ac3f7e3503cee01bb675aabdf5358dfe24f95374f1dee230e25be02c53259 +size 436415173 diff --git a/full_models/bkv/config.json b/full_models/bkv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bkv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bkv/vocab.txt b/full_models/bkv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4b466542a67eed699f2e0136216df9f5527377a1 --- /dev/null +++ b/full_models/bkv/vocab.txt @@ -0,0 +1,54 @@ +| +a +i +n +e +g +u +' +k +h +b +m +y +o +r +t +c +s +w +d +p +j +f +è +- +ì +l +é +á +ú +í +ē +ě +ī +ū +̀ +à +ā +ò +ù +ǹ +ó +ń +ō +̄ +î +û +0 +ḿ +â +ǎ +7 +8 + diff --git a/full_models/blh/D_100000.pth b/full_models/blh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1b217cee636c0e88e9174ac4732bde816247110a --- /dev/null +++ b/full_models/blh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82ccc4fb5d2f2e59e6c1042bf1816a5b020eaedc1d89eea9ef60671667695550 +size 561098185 diff --git a/full_models/blh/G_100000.pth b/full_models/blh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..875ccf90b2f670ddf8020febd62d649682805274 --- /dev/null +++ b/full_models/blh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:619853d2cbb7e7f656e07c6f86572bc498c04d2225a6f5e8453a4946fc5adf37 +size 436551873 diff --git a/full_models/blh/config.json b/full_models/blh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/blh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/blh/vocab.txt b/full_models/blh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2a9bfd65a14d9e31a7e2d16fa8d3e7d0b5840454 --- /dev/null +++ b/full_models/blh/vocab.txt @@ -0,0 +1,45 @@ +ù +w +e +ó +_ +ě +p +y +è +a +i +ǔ +̀ +ǎ +á +ŋ +b +ɤ +s +k +u +í +ɔ +j +m +l +ò +ì +f +t +n +ú +g +é +o +ǐ +1 +̌ + +ŏ +d +ɛ +à +v +́ diff --git a/full_models/blt/D_100000.pth b/full_models/blt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1bd3e78954ab9741d282a068df2c23848aa19913 --- /dev/null +++ b/full_models/blt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3729a708a62d908231a1446595d4fa89df11ed8b8d209225a23f7de8a2bca3 +size 561098185 diff --git a/full_models/blt/G_100000.pth b/full_models/blt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..264a95423799870e8d166552d1e39cf8435601c9 --- /dev/null +++ b/full_models/blt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c3de1d620e57f952111d0935409103b5990497861ed53ed754be0c42459dc5 +size 436609473 diff --git a/full_models/blt/config.json b/full_models/blt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/blt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/blt/vocab.txt b/full_models/blt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..29a65dbe5558b1f1ac11098bfa9c107bc0bf018f --- /dev/null +++ b/full_models/blt/vocab.txt @@ -0,0 +1,70 @@ +ụ +m +e +ệ +ộ +ẹ +n +v +c +ă +ỉ +ê +ô +ở + +k +i +ứ +a +_ +s +q +0 +h +ú +9 +ọ +‐ +ắ +o +ể +2 +5 +l +u +ơ +ế +ỏ +t +ả +á +d +í +ẳ +é +ợ +7 +ẻ +p +ố +b +ạ +g +1 +' +3 +ử +ặ +ị +ư +ổ +y +8 +ớ +ự +ó +đ +ủ +4 +6 diff --git a/full_models/blx/D_100000.pth b/full_models/blx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5f35d336054cfedf4543f87f8bd21a431f06dcf2 --- /dev/null +++ b/full_models/blx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783b964ec73285e8af690406dc74141c6a1774b638a6960dc228058ce32b1f5e +size 561098185 diff --git a/full_models/blx/G_100000.pth b/full_models/blx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81f348b409a4ae0754f5a355f6dfd843adb0c749 --- /dev/null +++ b/full_models/blx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e32b30e3bd464c86650fb9fcea2bb1b4346bad71c2b2b4524bfad8769196544 +size 436519617 diff --git a/full_models/blx/config.json b/full_models/blx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/blx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/blx/vocab.txt b/full_models/blx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..11691f8f7049896c24b9f0d0f2aedac7a28f3a15 --- /dev/null +++ b/full_models/blx/vocab.txt @@ -0,0 +1,31 @@ +o +d +k +w +f +a +n +_ +g +' +q + +u +t +ê +- +l +j +s +c +h +p +e +y +r +v +i +x +m +b +z diff --git a/full_models/blz/D_100000.pth b/full_models/blz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3451584cca5fa1288b626b8bfa42bf7cd0e43452 --- /dev/null +++ b/full_models/blz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff4d8bb32b116412f0306e0260b3943179808d7362efb32104e7c7e945d62bd +size 561078705 diff --git a/full_models/blz/G_100000.pth b/full_models/blz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c952a0d9bad99fecc03ad349aeda83bf4f9c2bb --- /dev/null +++ b/full_models/blz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54dc0cbc7b87ff81eb3ec847530cd06f5e5e8669c519819ce63972092037bdaa +size 436355260 diff --git a/full_models/blz/config.json b/full_models/blz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/blz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/blz/vocab.txt b/full_models/blz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d0e7f36d75f90c0e15038fed63d2f751745e3b90 --- /dev/null +++ b/full_models/blz/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +i +o +u +m +' +k +s +e +t +l +g +r +p +b +y +d +w +- +h +f +j +z +c +— + diff --git a/full_models/bmq/D_100000.pth b/full_models/bmq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..193ec2b55a413863168ccdc8843ab3682a455b29 --- /dev/null +++ b/full_models/bmq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50a8feb99aac690cec13a3f871537d0486b3c34e5634dec3f703f7ab07390bed +size 561098185 diff --git a/full_models/bmq/G_100000.pth b/full_models/bmq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..873aff9c8c66eee1c9ed344fd9e9983a6309979b --- /dev/null +++ b/full_models/bmq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600de658bd774aef5b07df6a5805fc8d063dd8b96c7af795a6fc04c0c28a603c +size 436558785 diff --git a/full_models/bmq/config.json b/full_models/bmq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bmq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bmq/vocab.txt b/full_models/bmq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3bf28f6ded495595ec53ba600188b01935457f32 --- /dev/null +++ b/full_models/bmq/vocab.txt @@ -0,0 +1,48 @@ +ɲ +h + +s +d +ɛ +v +l +ā +w +í +̀ +c +ū +ò +u +ē +e +i +m +à +y +ɓ +ú +è +a +– +f +ì +t +g +b +ō +o +n +_ +z +̄ +k +ù +r +p +' +á +é +- +ī +ó diff --git a/full_models/bmr/D_100000.pth b/full_models/bmr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0841722c8322c1b156b6aa1433b48c0d330dec2e --- /dev/null +++ b/full_models/bmr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ead91056fb9ffb6952c9761b7b28d7a47919ad1663951349c4e33ab2931bb5d7 +size 561098185 diff --git a/full_models/bmr/G_100000.pth b/full_models/bmr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bcab4593509c21e28a707a02617af54d93d7c854 --- /dev/null +++ b/full_models/bmr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8613e54f85185ce6341b477d7d80348bb06d6b6a3fa85e0086f7a1c317cd0981 +size 436517313 diff --git a/full_models/bmr/config.json b/full_models/bmr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bmr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bmr/vocab.txt b/full_models/bmr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..49ff608f37cbad87fb7e9111d235cc3cf4570f40 --- /dev/null +++ b/full_models/bmr/vocab.txt @@ -0,0 +1,30 @@ +k +q +y +c +f +x +u +t +i +ɨ +g +h +ñ +b +o +j +r +l +z +- +v +_ +d +a +e +s +p +m +n + diff --git a/full_models/bmu/D_100000.pth b/full_models/bmu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c2b25821ab6d131e8c7fb34d29ed75a793b78df --- /dev/null +++ b/full_models/bmu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7243dceb9619b00a1cd23c888388387b0b8a091fc1fb8314df8becedf8e295e +size 561098185 diff --git a/full_models/bmu/G_100000.pth b/full_models/bmu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2f373adb1ca5ee1a770805857809c96a78845356 --- /dev/null +++ b/full_models/bmu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526b784218d2df89861cee3aa15dee9b305b995d9de2b6efb00cb9fb396e57eb +size 436538049 diff --git a/full_models/bmu/config.json b/full_models/bmu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bmu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bmu/vocab.txt b/full_models/bmu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b84af31f584e42635f212982bc44d11781a8d38a --- /dev/null +++ b/full_models/bmu/vocab.txt @@ -0,0 +1,39 @@ +b +j +8 +z +l +a +e +u +ŋ +7 +i +k +n +3 +2 +4 +o +s +_ +g +q +' +1 +6 +5 +y +f + +9 +d +r +m +w +h +- +0 +ö +t +p diff --git a/full_models/bmv/D_100000.pth b/full_models/bmv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..28ec9e5be5fbe1c6a979522598e400bb36583a84 --- /dev/null +++ b/full_models/bmv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8cd15a8be0e13b253a0ffd59a55dcad1bceb4aa1794a180fed2f9fe04bf0232 +size 561098185 diff --git a/full_models/bmv/G_100000.pth b/full_models/bmv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3e43033d7269225b38e9d9e51daa020ee305443b --- /dev/null +++ b/full_models/bmv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43265b424895b61b1273fa26a790dab225a4660b94a926a4ea7f22ffaa23b05f +size 436540353 diff --git a/full_models/bmv/config.json b/full_models/bmv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bmv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bmv/vocab.txt b/full_models/bmv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d29d7ee6e496a401e1f6002136c60fe54477f3a --- /dev/null +++ b/full_models/bmv/vocab.txt @@ -0,0 +1,40 @@ +t +ê +h +g +i +à +ò +f +m +è +a +k +ù +ì +ô +̀ + +u +j +ə +w +e +ɨ +b +- +s +̂ +o +y +c +_ +l +û +ŋ +n +d +' +p +â +î diff --git a/full_models/bng/D_100000.pth b/full_models/bng/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3be2dac6098aac38c6ef92afc4429663d3cc39ac --- /dev/null +++ b/full_models/bng/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a18e2415c2d82ac0bdf8631faa238567d6aab49e81f54f56bd0377e59a839f7 +size 561078964 diff --git a/full_models/bng/G_100000.pth b/full_models/bng/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a65ce1e90d8306369f2104df932355f81ef9cbe6 --- /dev/null +++ b/full_models/bng/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa012f4324b738a10ee23ca3ceee25763dbd2defb646aefba34722d1bfc765e +size 436440940 diff --git a/full_models/bng/config.json b/full_models/bng/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bng/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bng/vocab.txt b/full_models/bng/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1de185348f6c847441888b0bd72d299d9297644d --- /dev/null +++ b/full_models/bng/vocab.txt @@ -0,0 +1,63 @@ +| +ে +া +র +্ +ন +ত +ি +ক +য +ব +ম +দ +ল +স +প +় +ু +আ +ো +শ +ছ +জ +হ +এ +ই +ী +গ +খ +থ +ও +ষ +ধ +ভ +চ +অ +ঁ +ং +ট +ণ +ড +উ +ূ +ঈ +ৃ +ঙ +ফ +ঠ +ঘ +ৌ +ঞ +ৎ +ৈ +ঝ +ঃ +ঐ +ঢ +- +ঋ +' +p +ঊ + diff --git a/full_models/bno/D_100000.pth b/full_models/bno/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..094d6b1d876d555f6c5f69304ca2d638edb7b401 --- /dev/null +++ b/full_models/bno/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ecf31e80b3ecba77616953c6d782d086bf34b45f9a662625a0eea4c750217e +size 561098185 diff --git a/full_models/bno/G_100000.pth b/full_models/bno/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8ce561fd212f287c60d85fcbfd69000a7aeaae3f --- /dev/null +++ b/full_models/bno/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39fa2f95c77b97d546f52d6516d58bb22d36d78b40cdcad0b01e88f394f654a +size 436524225 diff --git a/full_models/bno/config.json b/full_models/bno/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bno/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bno/vocab.txt b/full_models/bno/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..63cfb0028384f6c5d188fef4985dcaaa06440fbd --- /dev/null +++ b/full_models/bno/vocab.txt @@ -0,0 +1,33 @@ +c +b +q +é +z +à +i +_ +g +t +a +' +m +h +k +s + +- +y +á +v +w +o +p +d +u +l +r +x +e +f +j +n diff --git a/full_models/bnp/D_100000.pth b/full_models/bnp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..abfe8550280062c20f615a2fb6101d3f5f3bdd05 --- /dev/null +++ b/full_models/bnp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18fb0fcd59198b2b5e4ffe6ed731d7991e24503b95fa0bace26d9399cf220901 +size 561098185 diff --git a/full_models/bnp/G_100000.pth b/full_models/bnp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5fa9d27dae00a06a90656564ac7f2cd39e0ee1af --- /dev/null +++ b/full_models/bnp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79e4c8ac78ab8b4b0c4ce07b13ed72da14642ea84550c347dc10bf1b89bbd5b6 +size 436526529 diff --git a/full_models/bnp/config.json b/full_models/bnp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bnp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bnp/vocab.txt b/full_models/bnp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7085dffd3a7012ed44902564d718a49924e33eee --- /dev/null +++ b/full_models/bnp/vocab.txt @@ -0,0 +1,34 @@ +­ +3 +t +a +6 +u +8 +l +p +o +d +s +1 +r +n +- +_ +i +m +e +h +2 +5 +b +v +7 +4 + +k +g +0 +' +9 +j diff --git a/full_models/boa/D_100000.pth b/full_models/boa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7eec057a868e945b4b3d19a04a7ee4826ec9fad6 --- /dev/null +++ b/full_models/boa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef713028f42d1b84a8029edb2129f736e6b8eecaca949d81471b861b818e9780 +size 561078741 diff --git a/full_models/boa/G_100000.pth b/full_models/boa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed81c2541666b577a869e90d718f13cf9e9aa1ef --- /dev/null +++ b/full_models/boa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc613459fc6aa3a37b138bf945a0f2caa42c12d85c85c1b3cc030b0d1ceff61 +size 436395821 diff --git a/full_models/boa/config.json b/full_models/boa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/boa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/boa/vocab.txt b/full_models/boa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b28ddfee64e2f96bc209538af5aa70a51b7617ec --- /dev/null +++ b/full_models/boa/vocab.txt @@ -0,0 +1,45 @@ +| +á +e +é +a +í +m +t +j +y +ú +h +u +i +n +c +d +b +ɨ +v +s +r +ó +o +l +́ +p +k +w +ñ +— +g +- +0 +1 +7 +4 +2 +3 +5 +6 +8 +' +9 + diff --git a/full_models/bod/D_100000.pth b/full_models/bod/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..937fc73dde0f0d2da79eaed6d1f37ac956af44b7 --- /dev/null +++ b/full_models/bod/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cbe52dd5ebe1cfda20d5d32710dcf672a7d80f8afe31c3a07db6e4f9cf01614 +size 561078210 diff --git a/full_models/bod/G_100000.pth b/full_models/bod/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed9be1494b68761def01a78e4b7550b5e4b41178 --- /dev/null +++ b/full_models/bod/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22de6799e7aa73021a1151e3b9d95dc27579074d2b2f904ec82d18a7e7e464c4 +size 436425755 diff --git a/full_models/bod/config.json b/full_models/bod/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bod/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bod/vocab.txt b/full_models/bod/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8ffb1c4a3a0444133e856de378994ceb8e625d54 --- /dev/null +++ b/full_models/bod/vocab.txt @@ -0,0 +1,60 @@ +་ +ས +ི +ད +ག +ོ +ན +ང +བ +མ +ར +ུ +ེ +ྱ +འ +ལ +པ +ཁ +ཡ +ཀ +ྲ +ཞ +ཅ +ཕ +ྣ +ཆ +ྟ +ཐ +ཤ +ྐ +ཏ +ཉ +ྒ +ཚ +ཟ +ཱ +ླ +ྡ +ཙ +ྨ +ྤ +ཇ +ྗ +ཛ +ྔ +ཨ +ྩ +ཧ +ྙ +ྷ +ྦ +ྫ +ྕ +ྭ +ཝ +ཻ +ཌ +ཊ +ཪ + diff --git a/full_models/boj/D_100000.pth b/full_models/boj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..285260acc47311863bb7be7da7b576415928451c --- /dev/null +++ b/full_models/boj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9bb058abb2a773116fbefddbcdfcf067c74ff5bb27247ad91b13011f91e45e1 +size 561098185 diff --git a/full_models/boj/G_100000.pth b/full_models/boj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..597fe4a78291aaa92a8ad7846d5632ef69c5ef89 --- /dev/null +++ b/full_models/boj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1204cfe3d85849e206edf7d9a294a925fefdc740ed5a1c90ea7f491ad4f64f +size 436535745 diff --git a/full_models/boj/config.json b/full_models/boj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/boj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/boj/vocab.txt b/full_models/boj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7e6bca46b227b370995a916c1ed3fd574a8ec029 --- /dev/null +++ b/full_models/boj/vocab.txt @@ -0,0 +1,38 @@ +ñ +f +8 +9 +6 +j +1 + +b +' +y +3 +_ +v +r +u +d +n +0 +o +i +g +4 +t +h +w +s +7 +m +p +q +ŋ +2 +e +k +l +5 +a diff --git a/full_models/bom/D_100000.pth b/full_models/bom/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ddd4e8052db02867c0339f470944767824a6570 --- /dev/null +++ b/full_models/bom/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3b32d8a704e61dee64f22daaaff458b07e864a2772ee8a11c4b038cd851637 +size 561098185 diff --git a/full_models/bom/G_100000.pth b/full_models/bom/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b6216c32a52dfd70d912b11db484eb2a823848e0 --- /dev/null +++ b/full_models/bom/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d2fff83c82523e6280cce8d5f1a912f3491b2dc7eec1c75e3932205c8c85ca +size 436588737 diff --git a/full_models/bom/config.json b/full_models/bom/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bom/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bom/vocab.txt b/full_models/bom/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..166c6640f207f29e7dfbd329a86192c2ae78807d --- /dev/null +++ b/full_models/bom/vocab.txt @@ -0,0 +1,61 @@ +ō +ǒ +h +g +a +ó +k +ɛ +ǔ +ú +ò +y +é +́ +í +ê +à +i +- +— + +w +d +z +s +l +p +è +u +r +v +n +ɔ +â +á +_ +' +j +ù +c +ū +̌ +̂ +̄ +o +û +m +e +f +ī +î +t +ì +ǎ +̀ +ě +b +ā +ǐ +ô +ē diff --git a/full_models/bor/D_100000.pth b/full_models/bor/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..36266111ff24fd5f13d62c1265435e76402b4573 --- /dev/null +++ b/full_models/bor/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fad5eb51af38f9cd99ff36110bef56c7bd049d8ba2e6c613daf05f939f52108 +size 561098185 diff --git a/full_models/bor/G_100000.pth b/full_models/bor/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b2b8d04f20c96bdc08164406cb77707277e419c9 --- /dev/null +++ b/full_models/bor/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d48aa0adb0cee46711aa90e9b5c06453b0c556c150d5bcebf1986bb19cc024 +size 436561089 diff --git a/full_models/bor/config.json b/full_models/bor/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bor/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bor/vocab.txt b/full_models/bor/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2d91653c7af58c8389dcd01645761354e74cce6e --- /dev/null +++ b/full_models/bor/vocab.txt @@ -0,0 +1,49 @@ +0 +a +č +é +w +g +ê +b +o +d +q +m +v +ç +s +k +e +l +4 +6 +h +ã +x +r +á +f +n +_ +3 +2 + +i +ó +í +ü +ô +– +5 +j +' +7 +z +1 +u +c +p +â +ú +t diff --git a/full_models/bov/D_100000.pth b/full_models/bov/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e00d7e12cbfcc5667d579cf0ae26d52818f907c --- /dev/null +++ b/full_models/bov/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60118d6447d6e2c6280d81b9a43f6910d0b8e262ca69c391565e244545a1570a +size 561098185 diff --git a/full_models/bov/G_100000.pth b/full_models/bov/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..08667a2372c67d1861ef438106f957a6e18d0d75 --- /dev/null +++ b/full_models/bov/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8557e543311e2c9a077d14eca21da965d26009071d0bb3be2cc77d8eb7268d +size 436533441 diff --git a/full_models/bov/config.json b/full_models/bov/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bov/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bov/vocab.txt b/full_models/bov/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5340f112a261152095f150ef3d810319b14fb96b --- /dev/null +++ b/full_models/bov/vocab.txt @@ -0,0 +1,37 @@ +s +' +o +v +1 +̃ +_ +r +f +- +p +z +k +g +a +ã +u +h +t +́ +l +b +ó +m +y +í +w + +e +i +á +d +ɛ +ɔ +n +ũ +ĩ diff --git a/full_models/box/D_100000.pth b/full_models/box/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..61cd9ce20b24424985119d9cebd0ee07dd7deefb --- /dev/null +++ b/full_models/box/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fece6f5bdef92c23d2241d6fdc1d55c9edc1cd35e70e3307c597ed90b43576e2 +size 561098185 diff --git a/full_models/box/G_100000.pth b/full_models/box/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dc8b5e1a6dd5ce6e440ec3d1ab83a75eac3a8e6e --- /dev/null +++ b/full_models/box/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:286df31389ab3fe8d75d47a17f261663ac4bfc237f656ef947b1c524acf8ea91 +size 436561089 diff --git a/full_models/box/config.json b/full_models/box/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/box/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/box/vocab.txt b/full_models/box/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9163f9884861fd5bccd303802a6b7374c69e1e04 --- /dev/null +++ b/full_models/box/vocab.txt @@ -0,0 +1,49 @@ +d +ṹ + +b +̃ +́ +s +ń +ù +h +y +ò +ɔ +_ +o +a +ó +é +6 +è +ǹ +l +í +- +ã +m +e +ɲ +k +ɓ +n +c +t +r +f +p +ĩ +w +ì +v +u +ú +̀ +z +á +ɛ +ũ +i +à diff --git a/full_models/bpr/D_100000.pth b/full_models/bpr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f1044eb0aabbf69896557599275e8ba5f5104df6 --- /dev/null +++ b/full_models/bpr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0931393e9b5126e71a84f58fec2e495af5f9c74fb02d0d31b3afc38f6423522 +size 561078839 diff --git a/full_models/bpr/G_100000.pth b/full_models/bpr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ca3beba547d792ef5b2b41377b4432c3df0b8a76 --- /dev/null +++ b/full_models/bpr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dfff6a9a43e1eae2fc1943e76fb35e8be337b99d538f3fb2f6bc4bf0d37ff95 +size 436385977 diff --git a/full_models/bpr/config.json b/full_models/bpr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bpr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bpr/vocab.txt b/full_models/bpr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbd08f831cf751130e01857784e90d559b79ea05 --- /dev/null +++ b/full_models/bpr/vocab.txt @@ -0,0 +1,40 @@ +| +a +n +d +i +u +l +t +m +g +e +k +o +s +y +f +b +é +w +à +è +h +ò +r +ù +ê +p +- +ì +0 +1 +2 +' +4 +3 +7 +8 +c +5 + diff --git a/full_models/bps/D_100000.pth b/full_models/bps/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..194753c76122bb632a903d4882e9083a7bc3f59c --- /dev/null +++ b/full_models/bps/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7159d898f51829452bbcf117a041ffd7bf352d836ed32760471d64089a522b67 +size 561078842 diff --git a/full_models/bps/G_100000.pth b/full_models/bps/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..28ba9b11099de1c00cc1ec06c7ee886ec8e60244 --- /dev/null +++ b/full_models/bps/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e48d47f05e9a4aba9986c4684ab28015cf1ee32a289992e6f82f655738f67ce +size 436362940 diff --git a/full_models/bps/config.json b/full_models/bps/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bps/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bps/vocab.txt b/full_models/bps/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..28ea8b7baa52bf1ab482b31297bb396e03538472 --- /dev/null +++ b/full_models/bps/vocab.txt @@ -0,0 +1,30 @@ +| +a +n +d +i +u +l +t +g +m +e +k +s +f +o +y +b +w +à +é +è +ò +h +r +ù +ê +' +ì +p + diff --git a/full_models/bqc/D_100000.pth b/full_models/bqc/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..26c05205ce3891ce9217af1633a1ba606dfeb5be --- /dev/null +++ b/full_models/bqc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ea4e21b909a0bf593ef2036bbe4d5091d12eaf2488e85540f5a9e408ba65a5 +size 561078616 diff --git a/full_models/bqc/G_100000.pth b/full_models/bqc/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..3bcb03d0d813cb09e59c155b6583edebe4855dcf --- /dev/null +++ b/full_models/bqc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83abde5ffe4691ea582dcce5d5c7556edfaea102e8f9bccf092087edeb7d0389 +size 436399019 diff --git a/full_models/bqc/config.json b/full_models/bqc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bqc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bqc/vocab.txt b/full_models/bqc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fb134ed1622352bb5a6afb5eca72a6f0b5930fbf --- /dev/null +++ b/full_models/bqc/vocab.txt @@ -0,0 +1,47 @@ +| +a +ɛ +ↄ +i +́ +l +k +u +b +̃ +s +n +p +g +m +à +e +w +o +d +ã +á +y +̀ +z +ń +ĩ +t +ũ +ì +í +ò +f +v +ó +ɔ +' +ú +è +ù +ṹ +é +ǹ +h +ḿ + diff --git a/full_models/bqi/D_100000.pth b/full_models/bqi/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..53396fe3a08f15069eea8a3692be6d63dfdd17ed --- /dev/null +++ b/full_models/bqi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b75a41e5802a2507870e97b26448661cd895015b69d73764a0d7603992d70e +size 561076145 diff --git a/full_models/bqi/G_100000.pth b/full_models/bqi/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..415757428743ec7d85275854e5b5495a7023789b --- /dev/null +++ b/full_models/bqi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c6f35feeed08a6d3e36e4feb6946476dffc373cb984aca08ee08766c6bf447 +size 436371277 diff --git a/full_models/bqi/config.json b/full_models/bqi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bqi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bqi/vocab.txt b/full_models/bqi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..330485b4ba11932769f08ca7c1d7413dc650bb47 --- /dev/null +++ b/full_models/bqi/vocab.txt @@ -0,0 +1,43 @@ +| +ی +ا +و +ه +ن +م +ر +س +ک +ب +ݚ +ت +ٚ +د +خ +ز +ل +ش +گ +پ +ع +ح +ۨ +ج +ق +چ +ف +آ +ط +غ +ص +ٛ +ذ +ض +ث +ظ +ئ +ژ +ء +ۆ +ێ + diff --git a/full_models/bqj/D_100000.pth b/full_models/bqj/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c130b275ee1b2a332b142fcf60ff9b0a82ca8659 --- /dev/null +++ b/full_models/bqj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b028f3af0993bf0defeb05467530a4c362bdb98540fdac11751d586039463d0b +size 561110394 diff --git a/full_models/bqj/G_100000.pth b/full_models/bqj/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c5fd3d8ad1a3cf45cf5efdb451fc21f98175a1e --- /dev/null +++ b/full_models/bqj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfaf8d9101f40f3ea647b51b887cea8631df4deb779e22048b96aab81156df8a +size 436616305 diff --git a/full_models/bqj/config.json b/full_models/bqj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bqj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bqj/vocab.txt b/full_models/bqj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e965cace7b47962609bd60f2d43304a21d89fbef --- /dev/null +++ b/full_models/bqj/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +u +e +i +m +o +b +g +l +t +r +j +s +f +y +h +á +w +ᵽ +ú +k +ŋ +' +ñ +é +ĉ +í +ó +d +v +c +p +- +– + diff --git a/full_models/bqp/D_100000.pth b/full_models/bqp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..84c46a605028758e8378b6079933a143b631a7b3 --- /dev/null +++ b/full_models/bqp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2fda4b1a9b1dc7ff631c4a9dd35c7205123522f39658426a98f438cad2f8fc9 +size 561098185 diff --git a/full_models/bqp/G_100000.pth b/full_models/bqp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe219498dcb4030e7fd56b49afdca7dcc00b6c5d --- /dev/null +++ b/full_models/bqp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0a2fc166f48b8c6e92c317f3196c8bbd7f474231a101d53c9e71aa5c3598ea +size 436581825 diff --git a/full_models/bqp/config.json b/full_models/bqp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bqp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bqp/vocab.txt b/full_models/bqp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d425fdaee043519de24e6eb37baedf582484b71c --- /dev/null +++ b/full_models/bqp/vocab.txt @@ -0,0 +1,58 @@ +m +k +ɛ +á +6 +2 +5 +h +o +' +z +9 +t +p +3 +à +s +é +́ +b +ũ +8 +ń +a +v +e +ɔ +̀ +r +i +ó +y +ĩ +ḿ +- +f +ú +_ +̃ +è +0 +ã +ǹ +n +ù +ò + +d +7 +g +í +u +4 +l +ↄ +ì +1 +w diff --git a/full_models/bru/D_100000.pth b/full_models/bru/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e6d35531902041075e98175b1c578494c869a6b --- /dev/null +++ b/full_models/bru/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b375654fa8f525d5ad4dfbf22f7ed4748d0d5e58c743aadaed837d99c3311aaa +size 561078705 diff --git a/full_models/bru/G_100000.pth b/full_models/bru/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdd25f591d4041f0ff3e5d69e5e54b8c2313a951 --- /dev/null +++ b/full_models/bru/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358d5e7e8512ea2ef6561a9654f4ebff5eb62f5f5ecbca69bc5c553dd8e66346 +size 436403789 diff --git a/full_models/bru/config.json b/full_models/bru/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bru/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bru/vocab.txt b/full_models/bru/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..61ddbe9be1519190d2e785eb81f291717c2de130 --- /dev/null +++ b/full_models/bru/vocab.txt @@ -0,0 +1,48 @@ +| +a +n +i +c +t +h +q +g +m +s +o +u +á +r +l +p +y +â +ớ +ỡ +k +ễ +ứ +b +ũ +ĩ +ữ +ỗ +ê +‐ +d +e +ơ +í +ṓ +- +ố +ó +ô +v +ế +ō +é +ư +ú +' + diff --git a/full_models/bsc/D_100000.pth b/full_models/bsc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d459c202e01c5491d601bb040d1f516fab727911 --- /dev/null +++ b/full_models/bsc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eeb8dfb1cfa3f269a54ddbc449af7b5a9912c869d5daed2aece47e3d48736e0 +size 561098185 diff --git a/full_models/bsc/G_100000.pth b/full_models/bsc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..696671b2ab6d89c3951599e01351d7a8b866ddd8 --- /dev/null +++ b/full_models/bsc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a49f9aaee3df671b814faf32b75d4ae33c86f05e1859e15aeb35c2921fe820 +size 436528833 diff --git a/full_models/bsc/config.json b/full_models/bsc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bsc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bsc/vocab.txt b/full_models/bsc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b7ba97d6079d863f2f69ddf2e6eb497ec36cda62 --- /dev/null +++ b/full_models/bsc/vocab.txt @@ -0,0 +1,35 @@ +ñ +l +̃ +ɗ +ŋ +ë +- +w +ɓ +e +a +c +o + +ƴ +f +p +u +ỹ +h +m +t +x +k +b +g +y +j +d +_ +r +n +i +ŝ +s diff --git a/full_models/bsq/D_100000.pth b/full_models/bsq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3b85ef875c521749a76d723bab09ee09634daaa --- /dev/null +++ b/full_models/bsq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4bcfb3844995b0b3f211b6137c4d271d069ceebe189ce3f1a118db5fe0eba6 +size 561078377 diff --git a/full_models/bsq/G_100000.pth b/full_models/bsq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b83509349bdedea1aeba54848f9db6268945f3de --- /dev/null +++ b/full_models/bsq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49c1a3a36a6a5d930a669e4ac8403f11f8e203b318bb7fb7ca7f091094d69d6 +size 436428974 diff --git a/full_models/bsq/config.json b/full_models/bsq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bsq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bsq/vocab.txt b/full_models/bsq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6ccafc2bc99757b167ae6a8413b4a8c55ddb75e6 --- /dev/null +++ b/full_models/bsq/vocab.txt @@ -0,0 +1,60 @@ +| +ɔ +ɛ +n +̀ +ɖ +k +ɓ +m +y +é +a +à +́ +ì +w +í +- +d +è +ě +p +á +g +u +̃ +i +s +ú +ò +b +o +ù +e +ó +j +z +t +h +c +ǎ +ḿ +ǔ +ǐ +ĩ +̌ +ǒ +f +x +ã +ń +v +ũ +̄ +ū +ṹ +ǹ +ē +' + diff --git a/full_models/bss/D_100000.pth b/full_models/bss/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7cba081e355d13f875a3594378cc824561916dd9 --- /dev/null +++ b/full_models/bss/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a46eea5a542864c7b17303597eed91fe32a91865357fb1cc0828ac400320509 +size 561078620 diff --git a/full_models/bss/G_100000.pth b/full_models/bss/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e7c093c93019c02e13f80c841e901b314259177 --- /dev/null +++ b/full_models/bss/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa281a58c2e30b9e2bbb3d3c40bb5bd094de26b99d542843ea6442faac9c9be4 +size 436426582 diff --git a/full_models/bss/config.json b/full_models/bss/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bss/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bss/vocab.txt b/full_models/bss/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..db47ca0c1dd6dd9a32e4dc7463e36da14a56098c --- /dev/null +++ b/full_models/bss/vocab.txt @@ -0,0 +1,59 @@ +| +n +b +é +ɛ +e +m +á +d +a +́ +y +l +ɔ +s +k +t +g +ə +h +w +ŋ +o +ʼ +̄ +p +í +- +c +ó +i +ē +ê +u +ǒ +â +ḿ +ě +ú +̂ +̌ +r +z +ń +ǎ +ā +ǐ +ī +ō +ô +j +î +ū +û +f +ǔ +' +v + diff --git a/full_models/btd/D_100000.pth b/full_models/btd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..63ff62535c18f8c27e18d2d8cad0fcb9f7d94e7b --- /dev/null +++ b/full_models/btd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5514a50966acf16ea2a1457ac97e2546a406f1775cdf3d5ae9331fa31af182e +size 561098185 diff --git a/full_models/btd/G_100000.pth b/full_models/btd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f71e182645a6f748d1815e7dd04229b1749f7c2b --- /dev/null +++ b/full_models/btd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82fd8c3aef816944364a519ce868ee153715ff6656652a300b2fa38287fe417a +size 436535745 diff --git a/full_models/btd/config.json b/full_models/btd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/btd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/btd/vocab.txt b/full_models/btd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8ef305dec41e70fac732feb0865708c1449d298a --- /dev/null +++ b/full_models/btd/vocab.txt @@ -0,0 +1,38 @@ +d +- +m +8 +à +w +b +l +c +h +r +q + +s +9 +o +y +2 +e +g +j +a +_ +t +f +è +3 +5 +z +i +0 +ì +p +k +n +u +1 +' diff --git a/full_models/bts/D_100000.pth b/full_models/bts/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c092f7d68c0172baee68a9bbde605f1bf6d3029 --- /dev/null +++ b/full_models/bts/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6298edbf1db403fcb333e87de874be2037274bd3a2eee651278268e333d39eb5 +size 561078996 diff --git a/full_models/bts/G_100000.pth b/full_models/bts/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c59d7087b6661a56a9e53b171d88fddef81e1dc --- /dev/null +++ b/full_models/bts/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae67902b04ee7dc5d844be9533766a871106fc60e81acc58ddf3adf5571202cb +size 436359253 diff --git a/full_models/bts/config.json b/full_models/bts/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bts/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bts/vocab.txt b/full_models/bts/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bf963ca99373328d6ed17ba76b3379b621e15b5b --- /dev/null +++ b/full_models/bts/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +i +o +h +m +s +u +g +r +t +b +d +p +e +l +k +j +- +y +w +f +v +z +c +x + diff --git a/full_models/btt/D_100000.pth b/full_models/btt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57e24f292e6e3677bc7a27652f887811ab7bb19e --- /dev/null +++ b/full_models/btt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b964992119001d8ad2773a34a5c1bf5cef7d350c786f1f7bd245113a572c4958 +size 561098185 diff --git a/full_models/btt/G_100000.pth b/full_models/btt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5755f7f44ea21f36127dc6bccfdb9264e7c9b162 --- /dev/null +++ b/full_models/btt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c32fd0c78a54f10afca980ce46e90cb2ebfc54a2a42f122367712d123c272d6 +size 436568001 diff --git a/full_models/btt/config.json b/full_models/btt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/btt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/btt/vocab.txt b/full_models/btt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..51286667af9f93f4705959bda41e8bd13366cd6f --- /dev/null +++ b/full_models/btt/vocab.txt @@ -0,0 +1,52 @@ +î +ǎ +i +k + +ó +ē +s +p +a +ū +í +g +û +w +á +- +ě +ê +ù +t +n +j +é +_ +l +è +f +ā +r +m +â +ǒ +z +d +y +ī +' +c +ǔ +b +ò +ǐ +ı +u +o +ì +à +ú +ō +h +e diff --git a/full_models/btx/D_100000.pth b/full_models/btx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3decee9e892b5f0bc12b9986efbc5c0b45dde34 --- /dev/null +++ b/full_models/btx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af80f7eab80c235aa2deae9c1b755412df1d73791a49c5732593210294220294 +size 561098185 diff --git a/full_models/btx/G_100000.pth b/full_models/btx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..746a9ec0c020fc991f222e2a4775f2aa9ce2aa20 --- /dev/null +++ b/full_models/btx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb61997fd692793ea1a303cf8e0f2792bcea269835e163a3cb75b6f94832e715 +size 436528833 diff --git a/full_models/btx/config.json b/full_models/btx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/btx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/btx/vocab.txt b/full_models/btx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6ccfb9fa9eca42cf3793e0e49df4a3ccbe0f3a6e --- /dev/null +++ b/full_models/btx/vocab.txt @@ -0,0 +1,35 @@ +2 +- +h +1 +t +b +p +u +r +8 +d +4 +j +0 +7 +e +3 +6 +a +' +n +i +w +k +z +y +m +_ +g +c +o + +5 +l +s diff --git a/full_models/bud/D_100000.pth b/full_models/bud/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59cd25114fead320f535d7c21ba26cb808d5d446 --- /dev/null +++ b/full_models/bud/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80c5a07b088f30e4298c4a33926340f083137a73a83ea9a1fd45496cab069cb +size 561078880 diff --git a/full_models/bud/G_100000.pth b/full_models/bud/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ebf99ba47abf3b722faa626f8892e5d569316946 --- /dev/null +++ b/full_models/bud/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80c08b26618d1fabe5c75412dbe77fa1dcbadc214cebf237d00a30c646ab132 +size 436411898 diff --git a/full_models/bud/config.json b/full_models/bud/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bud/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bud/vocab.txt b/full_models/bud/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..522dc7b45ef22935e8de48c217cddc09d73baaa8 --- /dev/null +++ b/full_models/bud/vocab.txt @@ -0,0 +1,51 @@ +| +i +n +a +k +e +b +u +t +í +m +ɔ +d +y +p +á +l +ŋ +- +s +o +ì +ī +à +f +ǹ +ā +c +ń +j +ú +g +r +̄ +́ +ū +é +ò +w +̃ +è +ē +ù +̀ +ĺ +ḿ +2 +ï +1 +0 + diff --git a/full_models/bul/D_100000.pth b/full_models/bul/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5cb91fb6dd27dafb839a0e166119f3e87706eec6 --- /dev/null +++ b/full_models/bul/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1a9be52b46d20a6c20954d8cc9f9f0c8988f1a276c50a566e996bf6968821d +size 561110652 diff --git a/full_models/bul/G_100000.pth b/full_models/bul/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..284e2ca6bd0046b777c4ac4f813bc0255bbe46dd --- /dev/null +++ b/full_models/bul/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c13711dede9571a8af70eb561b171a01f0fdb2047e8cc10bfb14f31ab3f3196 +size 436619192 diff --git a/full_models/bul/config.json b/full_models/bul/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bul/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bul/vocab.txt b/full_models/bul/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..0fd96247c45e5b9b8b5bd5735791b7e678eedf2c --- /dev/null +++ b/full_models/bul/vocab.txt @@ -0,0 +1,37 @@ +п +е +р +– +х +щ +- +м +у +в +ф +ѝ +г +я +к +ц +ю +̀ +и +н +л +з +_ +й +ь +ѐ +о +с +б +ж +д + +ч +ъ +т +а +ш diff --git a/full_models/bus/D_100000.pth b/full_models/bus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97d7b209acd8e22a8d299fdf6000fc34828e9e1d --- /dev/null +++ b/full_models/bus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5224fd392f8b1d53894449532c7c6af16432dd2d8ed82705b8da0640cbb875d +size 561098185 diff --git a/full_models/bus/G_100000.pth b/full_models/bus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..16cc187d5028dbd01efcad1df7c3e5a49e39f6d7 --- /dev/null +++ b/full_models/bus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0600f4e9e5639ff112cc92bad51c914f38d427fe6bfe987312eb76e47e8b708 +size 436558785 diff --git a/full_models/bus/config.json b/full_models/bus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bus/vocab.txt b/full_models/bus/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dec7f727ce926a504121d520b32c533c084f8819 --- /dev/null +++ b/full_models/bus/vocab.txt @@ -0,0 +1,48 @@ +e +h +n +ù +b +z +è +p +g +ã +ǹ +ó +m +s +́ +v +é +k +y +ɛ +i + +̃ +à +a +' +- +̀ +u +ↄ +ĩ +ò +l +á +ḿ +d +t +f +ú +o +ń +w +_ +í +r +ɔ +ũ +ì diff --git a/full_models/bvc/D_100000.pth b/full_models/bvc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d4fb60d3eb8c414944b34095a9f98dc4a8071bee --- /dev/null +++ b/full_models/bvc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b629fed80eeecf74b51b1c6b3873270e206a821729278069a1f4e348c77949 +size 561098185 diff --git a/full_models/bvc/G_100000.pth b/full_models/bvc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4e94fcccb78905f6fda7c76598aba17ed0c1829 --- /dev/null +++ b/full_models/bvc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d804be14fc61eb77c8b295ccbe63ce2d809211e193a16d27efe197153d7183 +size 436521921 diff --git a/full_models/bvc/config.json b/full_models/bvc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bvc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bvc/vocab.txt b/full_models/bvc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f0f361e38a9b56ae59941283668f610aa0febe18 --- /dev/null +++ b/full_models/bvc/vocab.txt @@ -0,0 +1,32 @@ +f +6 +n +s +m +9 +3 +e +g +5 +u +4 +t +r +0 +v +' +l +k +h +d +1 +o +p +a +b +w +j +i +_ +2 + diff --git a/full_models/bvz/D_100000.pth b/full_models/bvz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..03ef5b37bfe2ab5e9ea744454284e3b6f4c649dc --- /dev/null +++ b/full_models/bvz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71214e5423f83f728255395eef75820454029227303fdb109611cc207fb22a9b +size 561098185 diff --git a/full_models/bvz/G_100000.pth b/full_models/bvz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..925ac93bd031774c5e6a309d60ee7ef8dcd93144 --- /dev/null +++ b/full_models/bvz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0522a06405383251fbf2323888a22eedb25cd8b3c894d8185584af187aa35643 +size 436510401 diff --git a/full_models/bvz/config.json b/full_models/bvz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bvz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bvz/vocab.txt b/full_models/bvz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24fbf42a1f3719b781711d8128dff848c9575f2e --- /dev/null +++ b/full_models/bvz/vocab.txt @@ -0,0 +1,27 @@ +v +r +y +m +u +j +c +d + +l +z +b +w +à +k +t +o +e +p +f +_ +s +a +g +h +i +n diff --git a/full_models/bwq/D_100000.pth b/full_models/bwq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7b277f743e15c812391e8d1a172f927bccb7cc41 --- /dev/null +++ b/full_models/bwq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0881c395bd813f7b6235184ea6256c7f6d295392f103b4c821daf9a5a0a043 +size 561078341 diff --git a/full_models/bwq/G_100000.pth b/full_models/bwq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b0a97af5f0ff3458fdf8e755ad01d010e9ecdf39 --- /dev/null +++ b/full_models/bwq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f50e30668472d7e731c780b1cdc6ed901644db96de7212c2628dbdef86a48f6 +size 436361033 diff --git a/full_models/bwq/config.json b/full_models/bwq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bwq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bwq/vocab.txt b/full_models/bwq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b6a2309852fbf889f363badec45eff939039e94b --- /dev/null +++ b/full_models/bwq/vocab.txt @@ -0,0 +1,31 @@ +| +a +n +ɔ +e +i +ɛ +m +y +k +w +r +t +o +b +g +s +d +u +l +p +f +z +' +h +v +́ +à +ì +- + diff --git a/full_models/bwu/D_100000.pth b/full_models/bwu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..559f969b443e85b98d4499ce3bd01d8deb4d295e --- /dev/null +++ b/full_models/bwu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:209bc7dd084c5e4ccee89e8ae808dd5eae5db8876787442dbbb4764f11c13a44 +size 561078708 diff --git a/full_models/bwu/G_100000.pth b/full_models/bwu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eec5adaa8666913fc85868ac74cbcd22f96c7f46 --- /dev/null +++ b/full_models/bwu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41a6cc0a709b63189557cee13de98d55ba8480588f9af610d0da3e30d367146a +size 436353853 diff --git a/full_models/bwu/config.json b/full_models/bwu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bwu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bwu/vocab.txt b/full_models/bwu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..10049a4fa09b6b4e084621ce5f96b0cb9b84463f --- /dev/null +++ b/full_models/bwu/vocab.txt @@ -0,0 +1,27 @@ +| +a +i +e +n +m +l +k +y +u +b +t +w +s +o +d +g +r +p +j +h +c +z +f +v +' + diff --git a/full_models/byr/D_100000.pth b/full_models/byr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9adbad2814396d068493d2f7b74ec90266717077 --- /dev/null +++ b/full_models/byr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836d2bb8dfbf4d7f38b42d1ff0fe5993161b933b622366ebfccf90b378c73860 +size 561098185 diff --git a/full_models/byr/G_100000.pth b/full_models/byr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6d08a749677888c68fb91159219cd48c39405f6b --- /dev/null +++ b/full_models/byr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5fce4eafb4c5d2fa7fc32e2c4f524e8d6cb37e3e5791b04b14100c38a27cbab +size 436533441 diff --git a/full_models/byr/config.json b/full_models/byr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/byr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/byr/vocab.txt b/full_models/byr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..52fe54d42d45c2acfd9b2ffcf4206fbd447089bd --- /dev/null +++ b/full_models/byr/vocab.txt @@ -0,0 +1,37 @@ +l +6 +m +p +v +z +3 +9 +r +a +o +h +' +j +w +4 +- +1 +g +7 +k +y + +_ +d +n +b +8 +e +ɨ +i +t +u +2 +5 +s +0 diff --git a/full_models/bzh/D_100000.pth b/full_models/bzh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39355eec9cfed9f95b86d6d398ba213046f4f2c7 --- /dev/null +++ b/full_models/bzh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb5f36df1366343b2d1ac9f2749401b702c92a86abae7b70da58a99a08f4fc6 +size 561098185 diff --git a/full_models/bzh/G_100000.pth b/full_models/bzh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b325172725fcb3ed3e32f78f8c4c4070cf23d71 --- /dev/null +++ b/full_models/bzh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964dc2966d13a3ece7def3a4035a83372a76b2c295a34e1ca1944dbd03d7f4d4 +size 436542657 diff --git a/full_models/bzh/config.json b/full_models/bzh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bzh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bzh/vocab.txt b/full_models/bzh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7cb6c97b6537b17a419a84c3102fafeae6e4591c --- /dev/null +++ b/full_models/bzh/vocab.txt @@ -0,0 +1,41 @@ +s +q +i +— + +k +o +w +j +a +v +e +u +8 +r +6 +- +ö +g +5 +m +d +7 +ë +2 +n +ḳ +l +ġ +' +1 +t +b +9 +y +3 +h +4 +0 +p +_ diff --git a/full_models/bzi/D_100000.pth b/full_models/bzi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0694fbf938d6aa1fc1e9817a93bb6f2c1ef8037f --- /dev/null +++ b/full_models/bzi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eedac5dab526eeac2ae9ec73927fab8c953394a93d30c4e603d222aada3ae10 +size 561098185 diff --git a/full_models/bzi/G_100000.pth b/full_models/bzi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..71aaf7a5e51fa5f107c5ff36866a159b25cb99af --- /dev/null +++ b/full_models/bzi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1317805d7d09eabf4e7f2a7977f7826e62e2aae2e1afe760abe901890405c0 +size 436614081 diff --git a/full_models/bzi/config.json b/full_models/bzi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bzi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bzi/vocab.txt b/full_models/bzi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f0128a53603b70beccf854bcdaddf65cdcd4ece9 --- /dev/null +++ b/full_models/bzi/vocab.txt @@ -0,0 +1,72 @@ +ี +ึ +่ +ร +ผ +โ +้ +ณ +า +ฺ +ค +q +ศ +7 +เ +ิ +ื +็ +น +4 +_ +- +' +ํ +ภ +ห + +ต +ด +8 +0 +ท +ฮ +ฎ +9 +๋ +1 +m +ง +ล +ม +บ +พ +ไ +ั +ุ +6 +ป +ย +แ +‍ +ฬ +ฟ +2 +ช +3 +ญ +ะ +ข +ู +ฐ +ส +อ +ว +5 +ษ +์ +ธ +ก +ซ +จ +ถ diff --git a/full_models/bzj/D_100000.pth b/full_models/bzj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5faac7d9b6c1170f6a5f6a0cef18c41996e570b5 --- /dev/null +++ b/full_models/bzj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f107ae2573a1a038dbf183f813156e62e60a5258254cc1731d9afbb58600856a +size 561078600 diff --git a/full_models/bzj/G_100000.pth b/full_models/bzj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b5342e8ef9b602de861707c480a92fd3547f736 --- /dev/null +++ b/full_models/bzj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d67a95acb48b25c0cefd39e636e1fd37c2768220b808319bfd2cd99d887fe35 +size 436357564 diff --git a/full_models/bzj/config.json b/full_models/bzj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/bzj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/bzj/vocab.txt b/full_models/bzj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1c60f9eacf1a28cfb9fce395744e1d2b80f76071 --- /dev/null +++ b/full_models/bzj/vocab.txt @@ -0,0 +1,29 @@ +| +a +n +e +h +i +d +o +s +w +t +l +u +r +k +m +f +p +g +y +b +z +v +j +c +- +' +— + diff --git a/full_models/caa/D_100000.pth b/full_models/caa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5e7f902ee816b54b665869d25ab863c1907090d8 --- /dev/null +++ b/full_models/caa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:865f016eeb463a2120752fad5fd518d0c31e082fca502eda45c41526961a1dcb +size 561077721 diff --git a/full_models/caa/G_100000.pth b/full_models/caa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c605636a457fe7087c8f9dba1bb0a8cd42b04707 --- /dev/null +++ b/full_models/caa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51da6dfb21e84b14b81dd176b2a79d2e8fe503a1f7734f79335301251d268f6 +size 436394198 diff --git a/full_models/caa/config.json b/full_models/caa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/caa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/caa/vocab.txt b/full_models/caa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8b525c390d398c0d03188e397174445d8b380def --- /dev/null +++ b/full_models/caa/vocab.txt @@ -0,0 +1,45 @@ +| +a +e +u +t +n +i +' +r +o +c +m +y +b +s +j +x +h +p +q +w +l +d +z +g +ú +á +í +— +é +f +v +ó +0 +1 +2 +5 +4 +k +3 +6 +- +9 +7 + diff --git a/full_models/cab/D_100000.pth b/full_models/cab/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..639bf51d2fe305bf1cd76668a304163549859a44 --- /dev/null +++ b/full_models/cab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ac058a493ded827e677eb8aa52f6e78688abfdb1ae2c276ac1ae533e9c85c0 +size 561078094 diff --git a/full_models/cab/G_100000.pth b/full_models/cab/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c174b82f0eb30dd9831a7579ec9ff8b930eae9d5 --- /dev/null +++ b/full_models/cab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba55276bfbcb1fb8d25577f5d7dd0d9bb4e92318261f59e009e8b3598db31c3 +size 436366646 diff --git a/full_models/cab/config.json b/full_models/cab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cab/vocab.txt b/full_models/cab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..223fed834bd3cad583f116d8731582331e2dc31f --- /dev/null +++ b/full_models/cab/vocab.txt @@ -0,0 +1,33 @@ +| +a +u +i +n +l +g +e +r +b +h +d +m +s +ü +t +ñ +á +í +w +f +o +é +k +ú +y +c +ó +p +— +ǘ +- + diff --git "a/full_models/cac-dialect_sanmateoixtat\303\241n/D_100000.pth" "b/full_models/cac-dialect_sanmateoixtat\303\241n/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..2a24832dbcca1cf81bd22dc398196f65f706f699 --- /dev/null +++ "b/full_models/cac-dialect_sanmateoixtat\303\241n/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e738549c0224d01a1efd2e4c997517d9b2aee5b3b96f1e8144cba1b82c26fc7e +size 561098185 diff --git "a/full_models/cac-dialect_sanmateoixtat\303\241n/G_100000.pth" "b/full_models/cac-dialect_sanmateoixtat\303\241n/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..e46191ded101fff5f6c05606af0834128473c8f2 --- /dev/null +++ "b/full_models/cac-dialect_sanmateoixtat\303\241n/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b42f5090658c2d4268c098fb4e2c8dd6916799100676d301f2b8eadbdc17f4b +size 436549569 diff --git "a/full_models/cac-dialect_sanmateoixtat\303\241n/config.json" "b/full_models/cac-dialect_sanmateoixtat\303\241n/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/cac-dialect_sanmateoixtat\303\241n/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/cac-dialect_sanmateoixtat\303\241n/vocab.txt" "b/full_models/cac-dialect_sanmateoixtat\303\241n/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..54f72d3adbd0eb8ef83e48a722d9d07f60c6b58c --- /dev/null +++ "b/full_models/cac-dialect_sanmateoixtat\303\241n/vocab.txt" @@ -0,0 +1,44 @@ +q +1 +b +3 +a +e +c +d +p +n +m +_ +4 +ú +é +ó +h +7 +y +i +g + +t +z +o +' +j +v +0 +8 +x +- +̈ +6 +9 +l +2 +u +s +í +f +5 +á +r diff --git "a/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/D_100000.pth" "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..ff8b41d7300348bcbb9516e38702e1f38e948c54 --- /dev/null +++ "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01039e8d33cd86e36e29b6215d051f6f5cb49bfa6c256686e657d13a8229f2ca +size 561078705 diff --git "a/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/G_100000.pth" "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..c28892abe165f7d69aa88d63e1505bd3c7d12512 --- /dev/null +++ "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b11347a1733a072a4bb08b1826baf825b73a72c86775dc056c0e8b32a7e83e9 +size 436398936 diff --git "a/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/config.json" "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/vocab.txt" "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..453816d9779aeea24b5f64f1b00ebfb745aff237 --- /dev/null +++ "b/full_models/cac-dialect_sansebasti\303\241ncoat\303\241n/vocab.txt" @@ -0,0 +1,47 @@ +| +a +' +c +n +i +t +e +o +j +l +y +u +s +x +b +h +w +m +z +̈ +p +q +r +d +ú +g +— +í +é +v +á +f +ó +- +4 +2 +0 +1 +9 +3 +6 +7 +5 +8 +k + diff --git a/full_models/cak-dialect_central/D_100000.pth b/full_models/cak-dialect_central/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c43b693e1dd90c257b1a18beeb3160c777222e74 --- /dev/null +++ b/full_models/cak-dialect_central/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09f3027fbd4198f9e57c043eab56201df57d8153c004fc71d99c9f347151b167 +size 561077825 diff --git a/full_models/cak-dialect_central/G_100000.pth b/full_models/cak-dialect_central/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5a9bd3508a5ff7e7737c19829cc10e4584c16a1a --- /dev/null +++ b/full_models/cak-dialect_central/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee4b896d96fd2024def9c9a524f01004fcd3eda50c524ccfd1ce207fbbf0b20 +size 436384990 diff --git a/full_models/cak-dialect_central/config.json b/full_models/cak-dialect_central/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cak-dialect_central/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cak-dialect_central/vocab.txt b/full_models/cak-dialect_central/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e8ac3a0c5b5e898075f80c08de30f4ee411718c2 --- /dev/null +++ b/full_models/cak-dialect_central/vocab.txt @@ -0,0 +1,45 @@ +| +i +a +r +' +n +k +e +j +o +c +h +u +t +l +q +x +y +m +w +b +s +p +- +z +d +á +ú +í +g +é +f +v +ó +0 +4 +1 +2 +5 +6 +7 +3 +à +ì + diff --git "a/full_models/cak-dialect_santamar\303\255adejes\303\272s/D_100000.pth" "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..95590a2283b56c4d20d28992e8a35714ce874578 --- /dev/null +++ "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d293cde60ccb371374bd23d3e08adbc35995ef79f51f7f26ad9466f53b4b59 +size 561076158 diff --git "a/full_models/cak-dialect_santamar\303\255adejes\303\272s/G_100000.pth" "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..fadf7c8648196468ca85221e2184d9fcc7f1aa75 --- /dev/null +++ "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4738f4a1f734636bbb87d2ebcdc3bc8c0c1703fb1331db8e5a13773bbbcbe99a +size 436353311 diff --git "a/full_models/cak-dialect_santamar\303\255adejes\303\272s/config.json" "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/cak-dialect_santamar\303\255adejes\303\272s/vocab.txt" "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..b27d78655248afdb2864bf2f7d204c95ec3e112a --- /dev/null +++ "b/full_models/cak-dialect_santamar\303\255adejes\303\272s/vocab.txt" @@ -0,0 +1,35 @@ +| +i +a +' +r +n +c +u +e +o +j +t +h +x +s +m +l +k +y +q +p +v +- +b +d +z +f +á +g +í +ú +é +ó +ñ + diff --git a/full_models/cak-dialect_santodomingoxenacoj/D_100000.pth b/full_models/cak-dialect_santodomingoxenacoj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5984e86aacab471e2ee0b791a2a14c0d8c5742e3 --- /dev/null +++ b/full_models/cak-dialect_santodomingoxenacoj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72956c9b5f947d814324e9018b7b9d30c0127f0e621ab68a503e69cfbf01e70c +size 561078500 diff --git a/full_models/cak-dialect_santodomingoxenacoj/G_100000.pth b/full_models/cak-dialect_santodomingoxenacoj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97fb1dcd7ed6ab081bdf3d98ba8dd3ed347969c7 --- /dev/null +++ b/full_models/cak-dialect_santodomingoxenacoj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e1cf5236860ab73064fc44a3fb5636124054344105cfadc0277c255300dc9c +size 436396723 diff --git a/full_models/cak-dialect_santodomingoxenacoj/config.json b/full_models/cak-dialect_santodomingoxenacoj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cak-dialect_santodomingoxenacoj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cak-dialect_santodomingoxenacoj/vocab.txt b/full_models/cak-dialect_santodomingoxenacoj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..499ca83cc3894af358cac4c174d5fc07274c1270 --- /dev/null +++ b/full_models/cak-dialect_santodomingoxenacoj/vocab.txt @@ -0,0 +1,46 @@ +0 +n +t +é +6 +c +w +ó +í +o +f +a +e +h +_ +l +4 +9 +i +v +q +1 + +g +ñ +- +2 +u +m +3 +5 +z +j +r +p +ꞌ +s +8 +k +d +ú +á +x +y +b +7 diff --git a/full_models/cak-dialect_southcentral/D_100000.pth b/full_models/cak-dialect_southcentral/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5abf4a45cf6d04372c934b8638c271a5e91f6163 --- /dev/null +++ b/full_models/cak-dialect_southcentral/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1df26624e3c6f2aec6cab7527e8fa8b1b134c9863b040776dedab3ca23b7e01 +size 561078345 diff --git a/full_models/cak-dialect_southcentral/G_100000.pth b/full_models/cak-dialect_southcentral/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..06a575357ef3fd22d8b41cfb3f221a8e739196d2 --- /dev/null +++ b/full_models/cak-dialect_southcentral/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f062263ec58d408bbe1bde84340363498eaef35ee6ec50d54270d034c3630568 +size 436371417 diff --git a/full_models/cak-dialect_southcentral/config.json b/full_models/cak-dialect_southcentral/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cak-dialect_southcentral/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cak-dialect_southcentral/vocab.txt b/full_models/cak-dialect_southcentral/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b0a46e064b355cb8fb9ba2a713b38efd71239934 --- /dev/null +++ b/full_models/cak-dialect_southcentral/vocab.txt @@ -0,0 +1,35 @@ +| +i +a +r +n +c +u +' +e +o +j +h +t +l +m +x +s +q +k +y +p +v +- +b +z +d +á +f +g +ú +í +é +ó +ñ + diff --git a/full_models/cak-dialect_western/D_100000.pth b/full_models/cak-dialect_western/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..622239be4a4730b1fd1539d0d689d9ea2c2e19c4 --- /dev/null +++ b/full_models/cak-dialect_western/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6911575101a7d283b6793c155547f9d77e33cb88d5751a7945b83d8b34ab2a58 +size 561076186 diff --git a/full_models/cak-dialect_western/G_100000.pth b/full_models/cak-dialect_western/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..745113cddcbdb07a4a579c1cf9044245b370574f --- /dev/null +++ b/full_models/cak-dialect_western/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c151ea7d910ffdc49a791d048c88c888026b164028ab72f7a14c356278b45cd8 +size 436355786 diff --git a/full_models/cak-dialect_western/config.json b/full_models/cak-dialect_western/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cak-dialect_western/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cak-dialect_western/vocab.txt b/full_models/cak-dialect_western/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..43dcfbc52feed86b7af6cc9ef7f53b7e4787c412 --- /dev/null +++ b/full_models/cak-dialect_western/vocab.txt @@ -0,0 +1,36 @@ +| +i +a +c +r +' +e +u +n +h +j +o +t +y +l +x +k +m +q +s +b +w +p +z +d +f +á +ú +í +g +ó +é +v +- +ñ + diff --git a/full_models/cak-dialect_yepocapa/D_100000.pth b/full_models/cak-dialect_yepocapa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..897001dadd22d76073c9fb718d30ac2d1a7ba0bb --- /dev/null +++ b/full_models/cak-dialect_yepocapa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afedaa20746bdadd7b526934df70a48acf2dfcdc3d73a146f66e5c265ab3b4b +size 561076200 diff --git a/full_models/cak-dialect_yepocapa/G_100000.pth b/full_models/cak-dialect_yepocapa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8719fc3c87521328fe78cf60d037bd9f5767f8d8 --- /dev/null +++ b/full_models/cak-dialect_yepocapa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa3a2f5f0986ad14160bfa43e6bbe0973daf7a3f84bfbf78bc9acde3c5e7ece +size 436339742 diff --git a/full_models/cak-dialect_yepocapa/config.json b/full_models/cak-dialect_yepocapa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cak-dialect_yepocapa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cak-dialect_yepocapa/vocab.txt b/full_models/cak-dialect_yepocapa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..012e5c491b6739aea7b935e535e0f32e71cbec7d --- /dev/null +++ b/full_models/cak-dialect_yepocapa/vocab.txt @@ -0,0 +1,29 @@ +| +a +e +i +n +c +r +' +u +o +j +h +t +y +m +x +s +k +l +q +b +- +p +v +z +d +f +g + diff --git a/full_models/cap/D_100000.pth b/full_models/cap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d694058bafc3c096f727bbe057a80358db618a84 --- /dev/null +++ b/full_models/cap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67cabffdd013c5cba5a08bbda603c94499e7a1fc60dd8fe398ddb0a710eda25 +size 561078884 diff --git a/full_models/cap/G_100000.pth b/full_models/cap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3760b3a488cee54d3af95345ebad196d1a02f31e --- /dev/null +++ b/full_models/cap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f930cd833084e551165c1d47f4b72fa69178cc4fce0680c16f57da87deff5d1f +size 436395990 diff --git a/full_models/cap/config.json b/full_models/cap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cap/vocab.txt b/full_models/cap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b219601e3afbbe7ebd1cfc41592fd34fd01b7fef --- /dev/null +++ b/full_models/cap/vocab.txt @@ -0,0 +1,44 @@ +a +| +i +n +h +k +t +ś +ź +u +l +ć +q +e +c +p +s +m +r +o +w +x +ñ +y +j +ï +ö +ä +' +d +– +ë +b +f +ü +í +é +g +z +ú +v +ó +á + diff --git a/full_models/car/D_100000.pth b/full_models/car/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..abc0288cff3e7bc8813345f0c5410ab1ce965754 --- /dev/null +++ b/full_models/car/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca809ef045db0d9e230daf5da16e8a079d75bf17dedce7cded772e64a723574 +size 561078855 diff --git a/full_models/car/G_100000.pth b/full_models/car/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a6af533c3dd33bbf5e68fb674b3bdfb49a13a0d1 --- /dev/null +++ b/full_models/car/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e0241b914940d4835294460602fb73d20c1a3ae3ec2bb7fa68df213bc78bcb +size 436356064 diff --git a/full_models/car/config.json b/full_models/car/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/car/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/car/vocab.txt b/full_models/car/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..daaab71a62a776f575d616fc634bab37c1f0d556 --- /dev/null +++ b/full_models/car/vocab.txt @@ -0,0 +1,27 @@ +| +o +a +n +m +r +' +y +k +e +t +i +p +u +w +s +j +b +d +g +l +f +h +- +v +z + diff --git a/full_models/cas/D_100000.pth b/full_models/cas/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..db4fb36291d3f9508cfe357841d529ba83dac0a7 --- /dev/null +++ b/full_models/cas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5fde115dd7e4c686a48ba1e2e66b8dfccfc9ec9c68465599a109df3afafff3 +size 561098185 diff --git a/full_models/cas/G_100000.pth b/full_models/cas/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e6e4651b6030bcde97c88b1794b80547a75ac26f --- /dev/null +++ b/full_models/cas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:277475d87664d465903b8d54defec242e8a112b41324552284a9f50b7b744807 +size 436584129 diff --git a/full_models/cas/config.json b/full_models/cas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cas/vocab.txt b/full_models/cas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dd7b4839455a664e039877eb3fa347c03ba98718 --- /dev/null +++ b/full_models/cas/vocab.txt @@ -0,0 +1,59 @@ +o +m +ñ +n + +t +ÿ +ạ +ụ +ẹ +f +s +z +l +- +4 +í +á +é +q +x +h +e +p +9 +5 +i +ä +0 +́ +j +r +̂ +3 +ọ +7 +â +6 +— +8 +ị +ĉ +a +ŝ +' +ú +1 +̣ +u +_ +b +g +̈ +c +2 +v +d +y +ó diff --git a/full_models/cat/D_100000.pth b/full_models/cat/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..19920f4b27c821563374442d6056289bce0605da --- /dev/null +++ b/full_models/cat/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f515375b914b445bb041ee57d9e4425cc75e64d2bbe62306fb268ab46b12277b +size 561110632 diff --git a/full_models/cat/G_100000.pth b/full_models/cat/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8e38aaeb27b5368a5e6c55d116f03a182819180b --- /dev/null +++ b/full_models/cat/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0382edd70333f8ddc663177e672c8a66312e1b30f7929a8f9d458ef66f6b5349 +size 436622793 diff --git a/full_models/cat/config.json b/full_models/cat/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cat/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cat/vocab.txt b/full_models/cat/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..5dab4cf295eb67fc7880288b7dcc1a5292975942 --- /dev/null +++ b/full_models/cat/vocab.txt @@ -0,0 +1,39 @@ +z +f +i +g +m +o +r +è +h +l +v +à +u +d +ú +ç +p +s +' +é +_ +- +e +a +— +x +ü +q +t +b +í +ó +ï +ò + +c +j +n +y diff --git a/full_models/cax/D_100000.pth b/full_models/cax/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4081d1464acf9e738e1aab982284be848d059ecf --- /dev/null +++ b/full_models/cax/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33f7227ce13c0f174fedb67757aeb1814e4982b2c44e14fc5446b729bb4a84bb +size 561078749 diff --git a/full_models/cax/G_100000.pth b/full_models/cax/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f7ccdc2373d4a424679afa4fcb90356a2a7aefd --- /dev/null +++ b/full_models/cax/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4686fec03cf23f8f28a564f02fdfe6f1ec26528470607c4674a31d5586fd603d +size 436375414 diff --git a/full_models/cax/config.json b/full_models/cax/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cax/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cax/vocab.txt b/full_models/cax/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..74c95d48ec28098e31deb43bf460f5f5ea4f70d0 --- /dev/null +++ b/full_models/cax/vocab.txt @@ -0,0 +1,36 @@ +a +| +i +n +t +ɨ +u +o +k +m +x +e +s +p +r +b +h +y +ñ +c +j +l +ú +d +í +– +g +é +' +f +ó +á +v +z +q + diff --git a/full_models/cbc/D_100000.pth b/full_models/cbc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6d744d540062f11f52fa0d30b969b91e1f0f5c00 --- /dev/null +++ b/full_models/cbc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae480264400041dc06d148bd6e644de2b3301007081662008f46ffae240640d1 +size 561076189 diff --git a/full_models/cbc/G_100000.pth b/full_models/cbc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d835965adb6775e49e1ede206d07fca48c439aa9 --- /dev/null +++ b/full_models/cbc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad86d1e415f03beccd944a341c38d02b6d675b82b9f2108a31287a5b61fbebc7 +size 436371891 diff --git a/full_models/cbc/config.json b/full_models/cbc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbc/vocab.txt b/full_models/cbc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b638d5205dce02f7de2124a65f4bbcdb50e9d50 --- /dev/null +++ b/full_models/cbc/vocab.txt @@ -0,0 +1,43 @@ +| +a +r +i +u +̶ +c +o +e +ã +m +t +n +ũ +j +p +b +ĩ +s +y +ẽ +ñ +g +q +õ +á +w +d +l +ú +í +ó +- +é +— +f +h +z +v +x +k +' + diff --git a/full_models/cbi/D_100000.pth b/full_models/cbi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0206e27b4b165dea811105c3ba5eed16ac8cb63a --- /dev/null +++ b/full_models/cbi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd7b5bf979ce76305ddfe8b4c8dca5637af9a6ad7f893a33aa2135ec9d38e416 +size 561098185 diff --git a/full_models/cbi/G_100000.pth b/full_models/cbi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..33d9a49b3fa9d632296c8c0e25cce5e83e82ad12 --- /dev/null +++ b/full_models/cbi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877f8cb34033507dcb99ba05c8d06689fd1fe5610e7f1d84459bf9f2aedd3706 +size 436556481 diff --git a/full_models/cbi/config.json b/full_models/cbi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbi/vocab.txt b/full_models/cbi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..12c7e213219d24740b6179ac0a18fcf77f489fc9 --- /dev/null +++ b/full_models/cbi/vocab.txt @@ -0,0 +1,47 @@ +j +w +t +q +c +v +2 +á +z +1 +4 +8 +_ + +l +5 +ú +k +ü +0 +d +9 +i +h +s +í +é +e +ñ +n +g +u +r +b +m +6 +f +o +p +3 +- +ó +y +' +7 +x +a diff --git a/full_models/cbr/D_100000.pth b/full_models/cbr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..058a574be6a6d9d980066eda3d39fb79a0441319 --- /dev/null +++ b/full_models/cbr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3d7c2d3829dc74ea8ed57280f374a1b79204e99ad3e871ba27d4f52119ae36 +size 561098185 diff --git a/full_models/cbr/G_100000.pth b/full_models/cbr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2925909f57740805221e83bf2f9530abe78ec2a --- /dev/null +++ b/full_models/cbr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ea9929ae6c21c3f5048297e01076979aa0ff2c6edbd84fa83f9974bc081640 +size 436535745 diff --git a/full_models/cbr/config.json b/full_models/cbr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbr/vocab.txt b/full_models/cbr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..41de50dc327dd4c8b022be1aaf23d3d1e5fa62b6 --- /dev/null +++ b/full_models/cbr/vocab.txt @@ -0,0 +1,38 @@ +ñ +t +x +b +é +a +ú +́ +k +i +q +d +h + +— +r +' +y +á +ó +g +m +f +u +p +ü +l +s +ë +e +j +n +í +v +z +o +_ +c diff --git a/full_models/cbs/D_100000.pth b/full_models/cbs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..26d02c03e96e466f7067e49414f8f81492b686ae --- /dev/null +++ b/full_models/cbs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6458fc4616e574a8c6b7bf56d15e940e03f3c1a6b8232823b4017713c9599b0 +size 561078457 diff --git a/full_models/cbs/G_100000.pth b/full_models/cbs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2fe570580690f194a7866a515901af54ff86f09e --- /dev/null +++ b/full_models/cbs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ba535734107a22ad1475fd9d7425e4c22a5480415a674aff23281c38d0a0f1 +size 436396733 diff --git a/full_models/cbs/config.json b/full_models/cbs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbs/vocab.txt b/full_models/cbs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50452203e9d0248432f501acfc158fe40a626495 --- /dev/null +++ b/full_models/cbs/vocab.txt @@ -0,0 +1,46 @@ +a +| +n +i +u +k +e +b +s +j +t +m +d +w +y +h +p +x +c +o +r +– +l +ú +é +í +g +0 +f +á +v +ó +z +1 +2 +q +7 +4 +' +ñ +5 +3 +6 +9 +8 + diff --git a/full_models/cbt/D_100000.pth b/full_models/cbt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..35fa63821539af70583965662bdcdc36c9057a3d --- /dev/null +++ b/full_models/cbt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd695603d04db0e8c11001f299ca7dfd1cc8842423abea5d71d031ef724a606 +size 561076204 diff --git a/full_models/cbt/G_100000.pth b/full_models/cbt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bec6d1d47832617b857cd7e081148bc3949f6a48 --- /dev/null +++ b/full_models/cbt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1a23055201aeca630e32f8a9050f89a48c911c4c68ff4cb0034662dc8f32df +size 436339785 diff --git a/full_models/cbt/config.json b/full_models/cbt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbt/vocab.txt b/full_models/cbt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..876a416f3240b98a7a1afa721f73ec015086d125 --- /dev/null +++ b/full_models/cbt/vocab.txt @@ -0,0 +1,29 @@ +a +n +| +i +o +ë +t +h +u +ꞌ +p +r +c +s +y +q +m +' +á +í +— +ó +d +l +e +́ +f +b + diff --git a/full_models/cbu/D_100000.pth b/full_models/cbu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..adcbdce13a0b2d23fde90e411cec3e30442aff9c --- /dev/null +++ b/full_models/cbu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de63a9ab6b27e7f4e8a92324cc81d0f2d07c9611708edb38543e76a59e074da +size 561078720 diff --git a/full_models/cbu/G_100000.pth b/full_models/cbu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..abd5cd940483300e957d8f2bf43a7b33d921a7c7 --- /dev/null +++ b/full_models/cbu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bed420e6770462b70d5bb85bdd4dcb6a5c6fa6e7fb06428bb7792a317a1c194 +size 436391987 diff --git a/full_models/cbu/config.json b/full_models/cbu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbu/vocab.txt b/full_models/cbu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ee0f60bd9e1338d5db93f839a9f1bb52d8500287 --- /dev/null +++ b/full_models/cbu/vocab.txt @@ -0,0 +1,44 @@ +a +| +i +n +s +t +u +r +h +p +m +y +k +e +g +c +l +w +o +z +á +d +b +' +j +í +x +ú +ó +f +0 +1 +v +2 +é +4 +5 +6 +3 +- +7 +9 +8 + diff --git a/full_models/cbv/D_100000.pth b/full_models/cbv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ad825f561dbe9f887e9b853db2cbd57a7262a7ee --- /dev/null +++ b/full_models/cbv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186ae6cb9b6ae9717cbcac8f2eae762a65d6bade457e93e560ea361c6e0307da +size 561076196 diff --git a/full_models/cbv/G_100000.pth b/full_models/cbv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b59ecae98a88477001ca816cea220317cccba433 --- /dev/null +++ b/full_models/cbv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f5f8f72f83e07cb85b119b58535ec99638b8a46cb594f2aa473908aca79128 +size 436380999 diff --git a/full_models/cbv/config.json b/full_models/cbv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cbv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cbv/vocab.txt b/full_models/cbv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7d0b91843f97cd561a5669b71184026d25f7952b --- /dev/null +++ b/full_models/cbv/vocab.txt @@ -0,0 +1,47 @@ +| +a +i +h +n +t +j +ʉ +e +c +á +d +p +b +o +w +ã +í +m +́ +ĩ +é +y +s +ó +ñ +u +r +̃ +g +l +q +ú +ẽ +' +— +f +v +z +õ +x +k +ò +ç +4 +1 + diff --git a/full_models/cce/D_100000.pth b/full_models/cce/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..df9a6c9209dcf7d45057f184c44701ce67ff0689 --- /dev/null +++ b/full_models/cce/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189b4091e6a6ed8407a76b6f8366b63124dd7652bd9e80635e5e4751d66571a3 +size 561078996 diff --git a/full_models/cce/G_100000.pth b/full_models/cce/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..33822fc78eed48e49efe80d4c2b5e88b00f43844 --- /dev/null +++ b/full_models/cce/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0979eb6c6402bffb70f9b150215e4ed83b12a3e44be9bb7a03ab58f7d61f65b +size 436367065 diff --git a/full_models/cce/config.json b/full_models/cce/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cce/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cce/vocab.txt b/full_models/cce/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a0d617da898379efc3ef85442e1d7a8d7ee8610a --- /dev/null +++ b/full_models/cce/vocab.txt @@ -0,0 +1,31 @@ +| +a +i +n +u +t +k +e +o +m +h +w +s +l +g +v +d +x +y +b +r +z +p +f +j +' +ñ +- +é +` + diff --git a/full_models/cco/D_100000.pth b/full_models/cco/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..e99766c3681832bea86fe7e06b75ddecbcb0f7fe --- /dev/null +++ b/full_models/cco/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0984e8200a4fec9d0095b34d028a7d17e72dd7546962694f7d0dc8cbd648f126 +size 561076172 diff --git a/full_models/cco/G_100000.pth b/full_models/cco/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f11dc1ee58755860d0f0ba7342d1a532de4f2b5 --- /dev/null +++ b/full_models/cco/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b7f4593370991577d82a8cdde76999e1f2ec20d36189db72770b8d076ece2b +size 436380762 diff --git a/full_models/cco/config.json b/full_models/cco/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cco/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cco/vocab.txt b/full_models/cco/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..442304f9b1c2fb5516eda7a8b5bca4a1b26c8d11 --- /dev/null +++ b/full_models/cco/vocab.txt @@ -0,0 +1,47 @@ +| +a +' +i +e +n +j +̱ +ˋ +ɨ +o +g +u +l +s +d +c +ˉ +̃ +ˊ +m +é +á +í +f +́ +r +q +b +t +ˆ +ʉ +ñ +ó +ú +ø +ǿ +ü +y +h +— +p +z +v +x +k + diff --git a/full_models/cdj/D_100000.pth b/full_models/cdj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7250d75cb21fc5434b6bf6471cbf005c3993fac9 --- /dev/null +++ b/full_models/cdj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:647bcabcb7bf8ae4780404d6c6e160fde7cf283b14227e1c52aac69e5ae3bcb2 +size 561079004 diff --git a/full_models/cdj/G_100000.pth b/full_models/cdj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..102f0a239a11297b657546df5ebe8b8a7bca4a14 --- /dev/null +++ b/full_models/cdj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e765e809a4d390fb3f10b39d8111ad7b60e13b5deab5a7389c4166df3391f65 +size 436447702 diff --git a/full_models/cdj/config.json b/full_models/cdj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cdj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cdj/vocab.txt b/full_models/cdj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..270abca6ede2111556c14969c48b5e68c1d5ec68 --- /dev/null +++ b/full_models/cdj/vocab.txt @@ -0,0 +1,66 @@ +| +ा +र +ै +ि +त +ं +क +् +ी +न +स +े +म +य +ु +ह +ज +प +व +ण +ल +ब +श +अ +ई +द +ड +ग +ू +ो +़ +ऐ +भ +आ +च +उ +झ +थ +ख +ौ +ध +छ +ठ +ट +फ +- +ष +घ +ए +इ +ँ +ढ +ञ +ऊ +औ +‍ +ृ +ओ +ः +7 +5 +' +3 +0 + diff --git a/full_models/ceb/D_100000.pth b/full_models/ceb/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee7bc99c50dc994d070864bf874918075ba25187 --- /dev/null +++ b/full_models/ceb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:696209672bf15714eb2d4abef6535d25e35aa2e182ab46f5f82534d837da219b +size 561078748 diff --git a/full_models/ceb/G_100000.pth b/full_models/ceb/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..37d8771bde0b3f5b66ae7e20ab9faaa8a0e37e92 --- /dev/null +++ b/full_models/ceb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2e1201219173166a884ef443b00c01ccf924080dda67a02a538aa2c571e46a +size 436388844 diff --git a/full_models/ceb/config.json b/full_models/ceb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ceb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ceb/vocab.txt b/full_models/ceb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bb8f031ff4cea6fe0ad67a975839ab8ab87115d4 --- /dev/null +++ b/full_models/ceb/vocab.txt @@ -0,0 +1,41 @@ +0 +j +z +d +6 +s +g +w +c +- +' +9 +u +v +r +2 +e +q +5 +t +h +— +8 +1 +a +p +x + +_ +l +n +m +4 +i +k +3 +o +7 +b +f +y diff --git a/full_models/ceg/D_100000.pth b/full_models/ceg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0845c18d87dc1a527389e486302b802a67a18b40 --- /dev/null +++ b/full_models/ceg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a1460c8501d2311003c1f24960aba3b6638004d209cb25f719e49141369dc1 +size 561078596 diff --git a/full_models/ceg/G_100000.pth b/full_models/ceg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..80661fc844455d479a01ee0076d4b5427eb79c1c --- /dev/null +++ b/full_models/ceg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5349afa707fc0120a8146a31c19d44a78f38ab212f7ba37e7d5437f61948f962 +size 436394410 diff --git a/full_models/ceg/config.json b/full_models/ceg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ceg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ceg/vocab.txt b/full_models/ceg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9dda0e97a315e703bee8396f0ba66181182e17fe --- /dev/null +++ b/full_models/ceg/vocab.txt @@ -0,0 +1,45 @@ +| +e +o +h +r +ɨ +a +s +t +u +k +i +y +n +j +p +c +l +m +w +õ +d +b +z +ĩ +̵ +ũ +ã +ẽ +— +ú +g +é +f +í +ó +á +v +q +̃ +- +x +ñ +' + diff --git a/full_models/cek/D_100000.pth b/full_models/cek/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d6139fbcc1024632e0317307691652542f09669c --- /dev/null +++ b/full_models/cek/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22116f1c3b1b34667375fbd9e437b97091e7746148622fcc4e42b391b2463536 +size 561098185 diff --git a/full_models/cek/G_100000.pth b/full_models/cek/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e8b158fa9766fc5c5260683ae648e537cb8ceed2 --- /dev/null +++ b/full_models/cek/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac70991ebf122b94cc6b1ed2c22e059dedf0c1ea7f214d016884825e84a7e7e5 +size 436533441 diff --git a/full_models/cek/config.json b/full_models/cek/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cek/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cek/vocab.txt b/full_models/cek/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..995a8f03daf5f83ed178b19147f17b7e147fe8b0 --- /dev/null +++ b/full_models/cek/vocab.txt @@ -0,0 +1,37 @@ +r +q +x +k +n +b +j +f +g +' +z +p +3 +ä +s +h +a +w +1 +e +ü +ö +2 +m +d +0 +t +_ +c +o +y +l +i +- +u + +v diff --git a/full_models/cfm/D_100000.pth b/full_models/cfm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c907fd71d5875c8a6736612027ec52ed25e8a86b --- /dev/null +++ b/full_models/cfm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c74faf76ebe8f981d7edb666a0f7e3b9c7aae8f74302e840cb84c1cbdd439c +size 561078749 diff --git a/full_models/cfm/G_100000.pth b/full_models/cfm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88a97c2bb1b68ae81bf135ecb5fde3b5fda2a338 --- /dev/null +++ b/full_models/cfm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4d55656c4e4e2e2fa8230fae863b83a3a9929a28f9478e98d1780863a8ee298 +size 436370778 diff --git a/full_models/cfm/config.json b/full_models/cfm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cfm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cfm/vocab.txt b/full_models/cfm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4adfa61ba1d9506ecc181e02418e37f49e3ae58f --- /dev/null +++ b/full_models/cfm/vocab.txt @@ -0,0 +1,34 @@ +| +a +n +h +i +u +t +l +k +m +e +g +s +r +p +c +w +o +d +z +b +ò +f +v +j +- +y +x +q +' +2 +­ +1 + diff --git a/full_models/cgc/D_100000.pth b/full_models/cgc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1e9bab9f28b123dbc72689b839671bc8e7bea9b8 --- /dev/null +++ b/full_models/cgc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6831429c0b3c038b048ca1225a9e843ca8a5474b03969788759e03aac50c57c +size 561098185 diff --git a/full_models/cgc/G_100000.pth b/full_models/cgc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..72ef48aafc561f587af3c424bf6bf7d0d881fc0a --- /dev/null +++ b/full_models/cgc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d94c49eb09d1db0b060004180a0ebfff74365546a78f742b8021387cec847063 +size 436519617 diff --git a/full_models/cgc/config.json b/full_models/cgc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cgc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cgc/vocab.txt b/full_models/cgc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..567755918e34f477a7bdb468cb1e812d087c3b90 --- /dev/null +++ b/full_models/cgc/vocab.txt @@ -0,0 +1,31 @@ +j +- +b +k +d +' +m +x +f +n +p +e +u +s +z +v +o +c +l +y + +r +i +6 +t +_ +w +q +h +g +a diff --git a/full_models/che/D_100000.pth b/full_models/che/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7e9c5bced4ad79eb29423e181d194c908a6e16e9 --- /dev/null +++ b/full_models/che/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151fe45c2d7bab0f840c2d3b202611a24a314fe3a6aa655ce5aa9bfe42ef884c +size 561098185 diff --git a/full_models/che/G_100000.pth b/full_models/che/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ab92212900aa30a00f03f2615c64006ddd7b9aa --- /dev/null +++ b/full_models/che/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d129a7adfa25fe56ea1c1c249c31aaa0f3e81e67622146aa0d063d74b88e084 +size 436531137 diff --git a/full_models/che/config.json b/full_models/che/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/che/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/che/vocab.txt b/full_models/che/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a5251f6f291a341c3a953d39e3952a56207c6481 --- /dev/null +++ b/full_models/che/vocab.txt @@ -0,0 +1,36 @@ +р +ж +о +э +- +ц +т +х +ч +' +и +ю +м +б +_ +у +з +е +с +ӏ +г +л + +а +я +в +ъ +– +ш +н +й +ф +ь +д +к +п diff --git a/full_models/chf/D_100000.pth b/full_models/chf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4628da2beb8535acc69b7a5e4183f76557ac217d --- /dev/null +++ b/full_models/chf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69686a0517030514572965faa528a08728a22937dc4c2f1b92a35c6c559550ff +size 561076159 diff --git a/full_models/chf/G_100000.pth b/full_models/chf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..37e4dbb2e3d1b270a871c485f7eff5bafb48dff5 --- /dev/null +++ b/full_models/chf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d334c7f49d8bc52b282951e5238d487f0cb969264d113a59e7adff9ce7b1c4f2 +size 436355397 diff --git a/full_models/chf/config.json b/full_models/chf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/chf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/chf/vocab.txt b/full_models/chf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4824452b21a4239d5fa3dbe75bdd54aba22a3479 --- /dev/null +++ b/full_models/chf/vocab.txt @@ -0,0 +1,36 @@ +k +m +g +_ +d +w +h +ó +ñ +z +' +i +j +q +s +t +b +p +e +l +é +r +o +í +ú +ä +u +v +c +f + +á +n +y +x +a diff --git a/full_models/chv/D_100000.pth b/full_models/chv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7a2d72ff427150cee699326c818baa6599a44d6c --- /dev/null +++ b/full_models/chv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dba8dbb838073c29877c0e4a43fb9d7e3389dd29dcbadf7b4b323be85fcd6f7 +size 561078965 diff --git a/full_models/chv/G_100000.pth b/full_models/chv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e8bf2f6bc7a1379409a1515177d2415b16b80715 --- /dev/null +++ b/full_models/chv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc1d65faa0519856014c7162c81cb8e4487ac9a0346144644fa48ff5bb400e84 +size 436385681 diff --git a/full_models/chv/config.json b/full_models/chv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/chv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/chv/vocab.txt b/full_models/chv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a64635e10fd2f7cc8775709483abbb8ac8b819b5 --- /dev/null +++ b/full_models/chv/vocab.txt @@ -0,0 +1,39 @@ +| +а +н +е +р +ӑ +т +ӗ +с +л +п +и +у +м +х +к +ҫ +в +ч +ш +ы +й +э +ӳ +о +- +я +– +ь +ю +д +г +ф +з +щ +б +ж +ц + diff --git a/full_models/chz/D_100000.pth b/full_models/chz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..93a3811bfdd57df8ff28fe7e1e0a4f0757d2877b --- /dev/null +++ b/full_models/chz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ee2a4a926aa838b373e09446e17033ffb890057c9719e8e77f7592fc325b6db +size 561078373 diff --git a/full_models/chz/G_100000.pth b/full_models/chz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4669d3ed996042ff7738546603e12b81e4990616 --- /dev/null +++ b/full_models/chz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639bfba41e240ef037e8ab9cfd8021ed869a8fafa80ce64115271c9339923a35 +size 436408119 diff --git a/full_models/chz/config.json b/full_models/chz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/chz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/chz/vocab.txt b/full_models/chz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6bb6023ef4fac8039ef43bd3b9ac5f5bbccc32ae --- /dev/null +++ b/full_models/chz/vocab.txt @@ -0,0 +1,51 @@ +| +a +h +̱ +ˉ +e +j +ꜙ +i +ˊ +ä +n +l +ꜗ +o +ꜘ +k +m +y +ë +s +g +d +u +ɨ +ˈ +t +w +c +ø +ʉ +b +r +ñ +ˋ +̃ +p +ꜚ +ú +— +é +í +ó +á +f +ʼ +z +v +q +x + diff --git a/full_models/cjo/D_100000.pth b/full_models/cjo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9c942d4d4ed6009c862201246ceb9cd8c3c5bfeb --- /dev/null +++ b/full_models/cjo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df55e23a8ea7339de57537bf1e1fc28296b7a664f81a9702f83f71306f7b7463 +size 561078629 diff --git a/full_models/cjo/G_100000.pth b/full_models/cjo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe8f66556fb3d5e9325661d8f4e049bf1a84d2ab --- /dev/null +++ b/full_models/cjo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3932adab7e2e587330754d02f5e4ffde2c6742ade2f1e0b43b4147a464e82672 +size 436373589 diff --git a/full_models/cjo/config.json b/full_models/cjo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cjo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cjo/vocab.txt b/full_models/cjo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ce440a52eb59f023e022ca8b79df933f2c02a1f --- /dev/null +++ b/full_models/cjo/vocab.txt @@ -0,0 +1,36 @@ +e +1 +c +3 +o +s +n +h +_ +0 +4 +2 +k +— +6 +j +u +z +p +5 +m +g +a +v +w +ñ +9 + +r +t +8 +y +i +- +7 +' diff --git a/full_models/cjp/D_100000.pth b/full_models/cjp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ca58ecf4ee9e1d8932e4950d336d1f9230d5de65 --- /dev/null +++ b/full_models/cjp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a70677d80653d594975bdfd5f2fcc8d32b867830d5a7d675d417f170403e74 +size 561078625 diff --git a/full_models/cjp/G_100000.pth b/full_models/cjp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d233bd0f306b7dd06bb7be214933485c0150e450 --- /dev/null +++ b/full_models/cjp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:645be1b3941afacfed050fae9bb076632920e6d5c439eb0fa12e04629455d946 +size 436391355 diff --git a/full_models/cjp/config.json b/full_models/cjp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cjp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cjp/vocab.txt b/full_models/cjp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b973d39307a299de638f718881bc71879eedc82 --- /dev/null +++ b/full_models/cjp/vocab.txt @@ -0,0 +1,43 @@ +| +a +i +k +e +̱ +ä +s +j +t +w +r +l +n +b +u +y +m +o +h +d +ñ +p +c +ö +á +à +í +ë +ú +é +— +g +v +f +z +ó +q +' +x +è +­ + diff --git a/full_models/cjs/D_100000.pth b/full_models/cjs/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7e3a93a1ad25a3894f7554de426444376bee55e --- /dev/null +++ b/full_models/cjs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f770a4f70054a4509c5718dd8627e79540bb30fcf2671c3ad5536e83cc5b78f +size 561076182 diff --git a/full_models/cjs/G_100000.pth b/full_models/cjs/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..71ad0c2ccac7a5e9b935add3e0d47535b4445a0f --- /dev/null +++ b/full_models/cjs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:335b40952ba8b1e4c4f291effb498d32a752253f4dd4ad1520e7fbbef91bd7e7 +size 436362566 diff --git a/full_models/cjs/config.json b/full_models/cjs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cjs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cjs/vocab.txt b/full_models/cjs/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..8f9a57891af534ba1b7925ebd28fbffbc04c34ad --- /dev/null +++ b/full_models/cjs/vocab.txt @@ -0,0 +1,39 @@ +| +а +е +и +р +н +ы +т +л +п +д +с +о +қ +ч +ғ +к +ң +м +у +й +з +б +г +– +ӱ +ш +ӧ +ж +э +- +ф +в +я +ё +х +ь +ц + diff --git a/full_models/cko/D_100000.pth b/full_models/cko/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3a9662af5bdca2f595a775797cecb19849d6a0f --- /dev/null +++ b/full_models/cko/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddbdb48c26e59f34d2db989e93715f158a351c0605ef0b4d4c33b93cb56513f +size 561078879 diff --git a/full_models/cko/G_100000.pth b/full_models/cko/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7c08944ca6957f57aa482a8eb9410d5a8ee6ee37 --- /dev/null +++ b/full_models/cko/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db8871f0dcbf9fe091d36212ec0800653609d999feaa2e0b91d1be000a377a74 +size 436376834 diff --git a/full_models/cko/config.json b/full_models/cko/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cko/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cko/vocab.txt b/full_models/cko/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b581fb2225b988dd3f1f98c134f0dbe25b93001d --- /dev/null +++ b/full_models/cko/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +n +m +ɛ +u +b +k +r +o +ɔ +s +y +e +t +d +w +f +ŋ +g +á +j +l +p +h +c +z +v +ó +í +ú +́ +é +' + diff --git a/full_models/ckt/D_100000.pth b/full_models/ckt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..291b2596bd641960e38caa801dd50c78143049c3 --- /dev/null +++ b/full_models/ckt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1bc5c2f1035a5712959a4e60590478764116916646dbf956d1c33927c15c0b +size 561076158 diff --git a/full_models/ckt/G_100000.pth b/full_models/ckt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..249638991d9dcd90cfedeeebe0cfba21673dcbfc --- /dev/null +++ b/full_models/ckt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d6565a7b54ad778e14c17c5e01ccf49016dc9ec2cc208cb3cc75b1c0bc718e6 +size 436362298 diff --git a/full_models/ckt/config.json b/full_models/ckt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ckt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ckt/vocab.txt b/full_models/ckt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c274c4d49e5855cd0bdcc0e29d8a3232809dcc06 --- /dev/null +++ b/full_models/ckt/vocab.txt @@ -0,0 +1,39 @@ +ы +| +н +э +т +а +и +к +р +ԓ +м +г +в +ъ +ӈ +ӄ +о +у +ь +ч +е +й +п +ё +с +я +- +– +ю +л +' +д +ф +з +х +б +ж +ц + diff --git a/full_models/cla/D_100000.pth b/full_models/cla/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d2a4d99804f1d999774dea85bc62c534c47d0e9 --- /dev/null +++ b/full_models/cla/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f53a052e6e403cfddbe3f2b8c18ee55f30c83a630b7449d030e793ee7f019ad9 +size 561078721 diff --git a/full_models/cla/G_100000.pth b/full_models/cla/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4474a364e1d4b850633197dbb9276e4f55485ce7 --- /dev/null +++ b/full_models/cla/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf86a8851dfa7eb87208ffa229ef9c54313894f9cfca577909582098c033d99 +size 436366412 diff --git a/full_models/cla/config.json b/full_models/cla/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cla/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cla/vocab.txt b/full_models/cla/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0d7ed157688845e34cb370a608d8cf66f794b520 --- /dev/null +++ b/full_models/cla/vocab.txt @@ -0,0 +1,32 @@ +| +a +i +m +s +n +t +u +e +k +h +w +l +y +o +f +g +r +ɓ +d +ɗ +' +b +p +c +j +z +v +- +2 +0 + diff --git a/full_models/cle/D_100000.pth b/full_models/cle/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0334d36fefb13ee59e7cd385ef4bd1819cc523df --- /dev/null +++ b/full_models/cle/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28d5865bc167f6c9a33a52d8494a5471426994afa6e04ea9766e46cac93942e +size 561076182 diff --git a/full_models/cle/G_100000.pth b/full_models/cle/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a50b21cce575cf840a755405a0d0a262c6987300 --- /dev/null +++ b/full_models/cle/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1750d64f3a5ed808e97780a774afb4a5485317e240b9afc850ed2beba246f21d +size 436374228 diff --git a/full_models/cle/config.json b/full_models/cle/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cle/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cle/vocab.txt b/full_models/cle/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b3bc98d4ec1eebbe14a8a57af7426881a82c6e33 --- /dev/null +++ b/full_models/cle/vocab.txt @@ -0,0 +1,44 @@ +| +3 +h +a +i +4 +2 +á +̱ +ɨ +j +d +y +c +e +n +l +s +u +m +x +1 +g +o +í +é +b +́ +t +ú +f +ñ +ó +r +v +p +ŋ +ü +z +q +k +- +' + diff --git a/full_models/cly/D_100000.pth b/full_models/cly/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e4304c3ceee7a5666b6d04c780e1c279d7b455f --- /dev/null +++ b/full_models/cly/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719a882ba4c32d36c7fba9d1fd5954f29356c12391e12826e608530ae385defc +size 561078738 diff --git a/full_models/cly/G_100000.pth b/full_models/cly/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f7a24981ae3b3f401521b66caabdabc1d16b05d5 --- /dev/null +++ b/full_models/cly/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac9eb89c3bfe8c7cac248019a53cff9983d20343142e432577d408997a19f839 +size 436379355 diff --git a/full_models/cly/config.json b/full_models/cly/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cly/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cly/vocab.txt b/full_models/cly/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..74ce798610b514cccb8c3334df768848e93ee6c9 --- /dev/null +++ b/full_models/cly/vocab.txt @@ -0,0 +1,38 @@ +q + +z +p +— +j +m +g +f +e +b +l +n +ó +t +é +_ +- +ú +o +ü +y +x +' +u +i +h +s +á +c +d +r +a +ñ +́ +í +v +k diff --git a/full_models/cme/D_100000.pth b/full_models/cme/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..52e435ded708bde4eaa88b5d0450cb9eb73a1466 --- /dev/null +++ b/full_models/cme/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b2faf0c0a1d75595ea5c884ca4f8dd50fe8a63282ab674549d9cf989489b52 +size 561078603 diff --git a/full_models/cme/G_100000.pth b/full_models/cme/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67f7ba3f72ff140d11a52ad139b08b1fb6a10e76 --- /dev/null +++ b/full_models/cme/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71157d4476792cd720605f5f33ff082f5958d036185c11da5f3cc098087f6005 +size 436373569 diff --git a/full_models/cme/config.json b/full_models/cme/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cme/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cme/vocab.txt b/full_models/cme/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ceeaac090f65e89f7611cee4eb7cd7fcfb78264 --- /dev/null +++ b/full_models/cme/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +u +ŋ +n +m +b +e +o +l +ɔ +- +d +ɛ +y +r +s +k +‐ +g +t +ã +h +c +w +f +ĩ +p +j +ũ +̃ +' +v +— + diff --git a/full_models/cmo-script_khmer/D_100000.pth b/full_models/cmo-script_khmer/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0926795682550b170f47701e1693c5b34d15a64f --- /dev/null +++ b/full_models/cmo-script_khmer/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad697b8127f2b5962ac3a01248ef9763274100664fa6572e7ece1d367b6318d +size 561078882 diff --git a/full_models/cmo-script_khmer/G_100000.pth b/full_models/cmo-script_khmer/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..032ba63d27e236bf5682e4479ee0262bbbbdcdd1 --- /dev/null +++ b/full_models/cmo-script_khmer/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2bb5aaa5f9661fb83de198243d5280552fbf553c7de882ee9ddc068f083832 +size 436421803 diff --git a/full_models/cmo-script_khmer/config.json b/full_models/cmo-script_khmer/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cmo-script_khmer/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cmo-script_khmer/vocab.txt b/full_models/cmo-script_khmer/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c7972883723a250ce2c193a652908fd3eec0e788 --- /dev/null +++ b/full_models/cmo-script_khmer/vocab.txt @@ -0,0 +1,56 @@ +ច +៨ +៦ +ឺ +ខ +ែ +ើ +ី +ទ +ា +ញ +ឞ +ូ +វ +ន +អ +ឆ +១ +០ +៩ +៤ +៥ +២ +រ +ោ +ៈ +ឹ +ម +ស +ផ +ប +៧ +ដ +់ +ៀ +_ +គ +៣ +ព + +យ +- +ល +ក +្ +ង +ជ +ត +៝ +េ +ៅ +ហ +ុ +ិ +ថ +ៃ diff --git a/full_models/cmo-script_latin/D_100000.pth b/full_models/cmo-script_latin/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..30cdb99086f5dc1309960b73b736219be839755a --- /dev/null +++ b/full_models/cmo-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928b21981d556f4dcbde2a14c39a48eb12636f132e71881ff100b6636cb7bc87 +size 561077728 diff --git a/full_models/cmo-script_latin/G_100000.pth b/full_models/cmo-script_latin/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..bfe361d2f5d92584d23a853e4d4b4b06fd91054e --- /dev/null +++ b/full_models/cmo-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ac3dfee64916eeb50c3c91b6c4db081e0d11c1e304a5a433599247deddb6d4 +size 436397105 diff --git a/full_models/cmo-script_latin/config.json b/full_models/cmo-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cmo-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cmo-script_latin/vocab.txt b/full_models/cmo-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..89e2ad9671bbae4f2b68eddf68814ac7288229a5 --- /dev/null +++ b/full_models/cmo-script_latin/vocab.txt @@ -0,0 +1,48 @@ +| +n +a +h +g +m +r +u +â +k +i +t +ă +y +l +p +b +ơ +d +ô +ê +j +e +o +s +ŏ +ŭ +đ +c +ĕ +ƀ +' +̆ +v +ĭ +0 +ư +1 +- +2 +4 +5 +3 +6 +7 +9 +8 + diff --git a/full_models/cmr/D_100000.pth b/full_models/cmr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..56e47c625c1a6c9ba048882b82f2b6af5e6b3bf5 --- /dev/null +++ b/full_models/cmr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41841f0719cf9aa9e9e79c3ca8027a7686b93549e93bcfe49227e9d2bb59ddba +size 561078851 diff --git a/full_models/cmr/G_100000.pth b/full_models/cmr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a1a2c0b4f5fa0a4ba848b99292427f02043f02c --- /dev/null +++ b/full_models/cmr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11f6879968391822083a6b0f645a43432d2d570e832787ea71a47aa1bcc9f68 +size 436373134 diff --git a/full_models/cmr/config.json b/full_models/cmr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cmr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cmr/vocab.txt b/full_models/cmr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a445d47870d58adc3e5b074c072ae2c22f9ca05b --- /dev/null +++ b/full_models/cmr/vocab.txt @@ -0,0 +1,35 @@ +k +o + +j +0 +v +i +z +q +p +d +r +w +f +6 +e +y +' +u +- +a +s +3 +h +b +m +n +1 +l +_ +2 +g +4 +x +t diff --git a/full_models/cnh/D_100000.pth b/full_models/cnh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b77432fb4129c502567512831c1431c959bab7ac --- /dev/null +++ b/full_models/cnh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0adcbe7733dfbb993e5aea6d0f062dce961aac1efe7b1c38d6df63c1e01231 +size 561078869 diff --git a/full_models/cnh/G_100000.pth b/full_models/cnh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81bb889ccfaae5c628df0e577b033f367ab7030d --- /dev/null +++ b/full_models/cnh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c75560deb730c12fdd369c2cbe84b451d64c5cca45ee65be6df5b031e4cbf8 +size 436361733 diff --git a/full_models/cnh/config.json b/full_models/cnh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cnh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cnh/vocab.txt b/full_models/cnh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..78856966f84d3ae77b47589db031841ed71ce090 --- /dev/null +++ b/full_models/cnh/vocab.txt @@ -0,0 +1,30 @@ +i +n +e +f +p +g +w +m +a + +o +j +t +y +- +_ +l +z +' +k +c +ṭ +— +b +s +v +d +u +h +r diff --git a/full_models/cni/D_100000.pth b/full_models/cni/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ae02719faa4fcf1a1bf13aba5f4fd15ce3de6c1f --- /dev/null +++ b/full_models/cni/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5dac455f983b3599ea3dacd397e31bb99dd0d73ee3384da686b7026167cf3b +size 561078614 diff --git a/full_models/cni/G_100000.pth b/full_models/cni/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7f0f680adab889ee89ae1bf7039f8e3ee3920d2 --- /dev/null +++ b/full_models/cni/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3626d9397a9b99bba4c0433740ab39297691e7236612d63117e6e8803423d263 +size 436362056 diff --git a/full_models/cni/config.json b/full_models/cni/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cni/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cni/vocab.txt b/full_models/cni/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fcdcaab81aabb9c323592cc70a105e6c01d7a308 --- /dev/null +++ b/full_models/cni/vocab.txt @@ -0,0 +1,31 @@ +a +i +| +e +t +n +r +o +s +c +p +q +u +m +j +h +v +y +- +0 +' +1 +2 +7 +4 +6 +5 +8 +3 +9 + diff --git a/full_models/cnl/D_100000.pth b/full_models/cnl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..228bc4d524ab6b5aa227b2084af4eddf0b96e736 --- /dev/null +++ b/full_models/cnl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e727aa19d1ca0c8b25136578fb0313884e002e22db1ff2b579b437191057133 +size 561076156 diff --git a/full_models/cnl/G_100000.pth b/full_models/cnl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6e1d586d5230683187ca29382acdd45f17ad7a87 --- /dev/null +++ b/full_models/cnl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8706d60c03bf183c849b989f68d530e33b952e6a6495f4ddd4946ba4ab729d99 +size 436376482 diff --git a/full_models/cnl/config.json b/full_models/cnl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cnl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cnl/vocab.txt b/full_models/cnl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6c7d3c3801cc2930898722d0dc2cd77c95fb527c --- /dev/null +++ b/full_models/cnl/vocab.txt @@ -0,0 +1,45 @@ +1 + +y +v +r +á +z +k +ñ +ó +j +́ +n +s +_ +e +é +í +u +ŋ +ʉ +ü +h +' +g +i +̱ +a +t +x +ǿ +c +ɨ +b +q +o +ú +f +2 +ø +m +d +p +3 +l diff --git a/full_models/cnt/D_100000.pth b/full_models/cnt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..86653df124bae5cd0a62bf284d4840b80ccb24e7 --- /dev/null +++ b/full_models/cnt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:511140dd7bda53d5f36392aeb47071f27a586e1b5d94a32dd13bbc68e7902c59 +size 561078073 diff --git a/full_models/cnt/G_100000.pth b/full_models/cnt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c2720833a6c2ee5b7c4a97251b641de4a3c751c --- /dev/null +++ b/full_models/cnt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24454a38241841c3feac76a3846951d0ad7caea2e98e774e8f9108b1bfc53afd +size 436394299 diff --git a/full_models/cnt/config.json b/full_models/cnt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cnt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cnt/vocab.txt b/full_models/cnt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..327ba952b47338e1293e58a4a30a547ad7b7abbd --- /dev/null +++ b/full_models/cnt/vocab.txt @@ -0,0 +1,45 @@ +| +2 +a +' +i +n +j +u +4 +5 +3 +g +e +s +c +á +ɨ +1 +l +o +d +ë +m +t +́ +q +ó +é +ŋ +b +r +h +ú +í +p +ü +- +f +v +z +y +k +x +ñ + diff --git a/full_models/coe/D_100000.pth b/full_models/coe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b8b2b7bb6739fdc933e582b5cdc296184edd5dd7 --- /dev/null +++ b/full_models/coe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9b8d2876cc221ca4d4e731243bc31edf2b1c34c77b0dc8c6f19d49098e83609 +size 561076186 diff --git a/full_models/coe/G_100000.pth b/full_models/coe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3393aac42b61e5d213e2ac95338b391c1fd8464a --- /dev/null +++ b/full_models/coe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169c568e9f536771881faff6ddd79ac5fe9c02d80318bc6da2129299444369f5 +size 436369702 diff --git a/full_models/coe/config.json b/full_models/coe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/coe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/coe/vocab.txt b/full_models/coe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f10cbd5f129758f86e7a768d218b3797cb6f59a7 --- /dev/null +++ b/full_models/coe/vocab.txt @@ -0,0 +1,42 @@ +a +| +ʉ +e +' +i +c +o +h +n +r +j +s +m +p +k +u +t +ã +ñ +v +ũ +d +̃ +ẽ +ĩ +— +l +õ +ú +í +b +g +é +f +á +q +ó +z +y +x + diff --git a/full_models/cof/D_100000.pth b/full_models/cof/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce917c6f027d34702a4e00c7fe941012f5450393 --- /dev/null +++ b/full_models/cof/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0911ee9211633669dc6bc5b66ab38759ae17e6be43d9c19a5e15261a8aa29878 +size 561078711 diff --git a/full_models/cof/G_100000.pth b/full_models/cof/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a849900a64c2ac8c6ae4fa8ff3e0574c09177bd1 --- /dev/null +++ b/full_models/cof/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbc987596c8b545730db6ebfd362fe1bfb398e225b8054335901d85471162c0 +size 436368980 diff --git a/full_models/cof/config.json b/full_models/cof/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cof/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cof/vocab.txt b/full_models/cof/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..444dd18c775c454ca8e99dfb1975e934a3b453d1 --- /dev/null +++ b/full_models/cof/vocab.txt @@ -0,0 +1,34 @@ +a +p +r +í +i +o +v +t +ñ + +é +f +j +g +ó +á +ú +m +c +h +y +d +z +b +n +u +l +x +q +— +w +_ +s +e diff --git a/full_models/cok/D_100000.pth b/full_models/cok/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..60f8c176d30a4bdb1e4dfa6f4e7d8a46ecd84dd3 --- /dev/null +++ b/full_models/cok/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12c3a893b0535db88c0002cc63f41302b03124060e81acf7db5578f10e2fb91 +size 561078709 diff --git a/full_models/cok/G_100000.pth b/full_models/cok/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..62d386dc66698f4b43343bf386bc5f616afdaa4c --- /dev/null +++ b/full_models/cok/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fd1a478f1240b5da7026444bc44e447200e7e31eff9918797eec3a38ef31a2 +size 436375635 diff --git a/full_models/cok/config.json b/full_models/cok/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cok/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cok/vocab.txt b/full_models/cok/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b29d7dbd4e1b3146739b401658ac44194905f8a2 --- /dev/null +++ b/full_models/cok/vocab.txt @@ -0,0 +1,37 @@ +d +r +' +ñ +l +ú +a +h +x +b +m +- +c +ɨ +g +í +p +n +j +u +é +́ +o +t +ó + +q +á +s +i +v +z +f +k +y +e +_ diff --git a/full_models/con/D_100000.pth b/full_models/con/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf30822a9a2d04d905b49147b1adbfec4ca7bb89 --- /dev/null +++ b/full_models/con/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b305cb8995b85072d0845f6ed24f108491d32bf232ddb0dedfe0ba4c1a4d176 +size 561078704 diff --git a/full_models/con/G_100000.pth b/full_models/con/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e3a026205a5b1b8145c50474ebf90a8e0a599b4 --- /dev/null +++ b/full_models/con/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae477bb52f3581f886876f12ff0edc4db5ee0a1640e638330bf78a21edb93e9 +size 436375981 diff --git a/full_models/con/config.json b/full_models/con/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/con/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/con/vocab.txt b/full_models/con/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..206db65592c40f3f778482bc6316f7dd024142fd --- /dev/null +++ b/full_models/con/vocab.txt @@ -0,0 +1,37 @@ +a +| +e +i +n +s +' +c +t +u +o +m +j +q +h +g +p +f +d +y +ñ +b +v +r +ú +l +— +é +- +z +á +í +ó +x +k +ḿ + diff --git a/full_models/cot/D_100000.pth b/full_models/cot/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5d3fcb5fd5a98f62a49b8a82534ed0a6123396a7 --- /dev/null +++ b/full_models/cot/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc5782f95fa4762a4304cce9a12be477652c1b96dd9dc151e62f878964b167b +size 561078209 diff --git a/full_models/cot/G_100000.pth b/full_models/cot/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdc4da46400d2099b30d71f26eb0b1cdc1280d2b --- /dev/null +++ b/full_models/cot/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e740c204108b39d9f81c4db40554b8e249bccdd201ccebb9ef26e1b806013d +size 436387289 diff --git a/full_models/cot/config.json b/full_models/cot/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cot/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cot/vocab.txt b/full_models/cot/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..79dcd07bb8f3781220293c64019ae432697276f4 --- /dev/null +++ b/full_models/cot/vocab.txt @@ -0,0 +1,42 @@ +a +7 +i +r +y +5 +o +q +9 +j +u +ó +e +_ +4 +p +b +' +v +3 +é +g +2 +l +m +0 +8 +x +s +— +z +f +ñ + +6 +1 +í +n +c +h +t +d diff --git a/full_models/cou/D_100000.pth b/full_models/cou/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..30a1c7b8b2d1e7c88241f19b0f9fdb6396250af4 --- /dev/null +++ b/full_models/cou/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496f471383a2f7f80480d40e47cca50105ac105166b63ac6b75c307d092fbc9a +size 561079110 diff --git a/full_models/cou/G_100000.pth b/full_models/cou/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..326d3ed82a6ef75f766b40c3fb16786d392d8eef --- /dev/null +++ b/full_models/cou/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d60a755b7bbb6881dee1ac98c328b64ae0384d3e2d3adee8763c62b1a7abf01 +size 436382292 diff --git a/full_models/cou/config.json b/full_models/cou/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cou/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cou/vocab.txt b/full_models/cou/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fb7ac7317698f15b06f36bd2215c95e8f55ddf8d --- /dev/null +++ b/full_models/cou/vocab.txt @@ -0,0 +1,37 @@ +| +a +ë +n +h +i +k +e +w +o +u +t +r +l +v +y +m +s +f +ɗ +̃ +d +ŋ +g +p +c +ỹ +ɓ +j +b +ƴ +ñ +' +- +á +— + diff --git a/full_models/cpa/D_100000.pth b/full_models/cpa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..415b758b8162c04b592ae17cb10da8272ee85083 --- /dev/null +++ b/full_models/cpa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69c616f90c0b8ffeaf9af7a63689d420639bcdd75d9ef9eacdc7ef0da48085c +size 561078639 diff --git a/full_models/cpa/G_100000.pth b/full_models/cpa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..71f4aa7a27d35d53e0cf7666f912e73c2840ccad --- /dev/null +++ b/full_models/cpa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784286e8bdacb7b2d05852864ae6499c477fcde97e97ea4a6d253ddf7a8ef7e9 +size 436387404 diff --git a/full_models/cpa/config.json b/full_models/cpa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cpa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cpa/vocab.txt b/full_models/cpa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..54e81302531346da54e5e333c7d2e5e2adc5ddf7 --- /dev/null +++ b/full_models/cpa/vocab.txt @@ -0,0 +1,42 @@ +3 +ø +́ +q +1 +ó +f +_ +b +x +l +t +u +i +n +g +ǿ +ŋ +r +k +z +ë +s +ñ +í +ú +m +j + +c +ü +2 +é +á +y +o +v +d +p +h +a +e diff --git a/full_models/cpb/D_100000.pth b/full_models/cpb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..073a4a032b080a78969115003055add93de3441c --- /dev/null +++ b/full_models/cpb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2f8556134f75bb536ab3cf868a643f2a97827f20ec36c0add610a90eb301c0 +size 561078969 diff --git a/full_models/cpb/G_100000.pth b/full_models/cpb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b38e0819d7d8f281d930db754b631a0036117140 --- /dev/null +++ b/full_models/cpb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f31f655297f92e7af9f3e304a57842fe71ed7374431391e759cae58e36f403d +size 436399715 diff --git a/full_models/cpb/config.json b/full_models/cpb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cpb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cpb/vocab.txt b/full_models/cpb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4981388987c6f9ce8b2cdb37a6630e606aa1181 --- /dev/null +++ b/full_models/cpb/vocab.txt @@ -0,0 +1,46 @@ +_ +n +t +p +c +é +6 +s +ñ +8 + +b +í +x +h +9 +v +á +m +0 +3 +4 +z +u +q +' +w +ú +7 +5 +2 +i +l +o +f +y +g +r +j +d +a +1 +- +k +ó +e diff --git a/full_models/cpu/D_100000.pth b/full_models/cpu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0109236b7973d721bea9a3ea0080dcf7bfa8bf4f --- /dev/null +++ b/full_models/cpu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db5460b80378dc07866a6a9db10b63fb27f2408da4434fdb1a16c207a9488e4 +size 561078959 diff --git a/full_models/cpu/G_100000.pth b/full_models/cpu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..01d83ad7e20882b43422b50b42a45da5c90e8168 --- /dev/null +++ b/full_models/cpu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f9b80784ee642a3a603e00d0bea7fce6790a9294f3b210c52a2b36ce551c560 +size 436395089 diff --git a/full_models/cpu/config.json b/full_models/cpu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cpu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cpu/vocab.txt b/full_models/cpu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c0fbb2e51f8d13d5c673ba2e25e2640cb1651872 --- /dev/null +++ b/full_models/cpu/vocab.txt @@ -0,0 +1,44 @@ +1 +g +4 +h +9 +e +2 +k +_ +x +- +r +á +ñ +m +7 +c + +n +b +0 +j +ú +5 +a +p +y +l +i +6 +v +8 +z +í +t +f +ó +3 +d +u +s +é +q +o diff --git a/full_models/crh/D_100000.pth b/full_models/crh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..627f7ee20faf27b38fd8f2dff048f4e5dde4e113 --- /dev/null +++ b/full_models/crh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda4083a0cacebc5b715d02d7c64ecc586c131df3b323a960fd980cc195785c6 +size 561079150 diff --git a/full_models/crh/G_100000.pth b/full_models/crh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2cf874889f66d7927440165d41e3f85493912737 --- /dev/null +++ b/full_models/crh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cfb8eb90c3ee44c1e2519d3eca29ca7567daa98bbdcc2577c2a522f8d7cb122 +size 436397121 diff --git a/full_models/crh/config.json b/full_models/crh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crh/vocab.txt b/full_models/crh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5e24f94ea558a2c53c08ae0397fdccfd871cfa7d --- /dev/null +++ b/full_models/crh/vocab.txt @@ -0,0 +1,44 @@ +а +6 +5 +е +ж +ы +4 +и +к +0 +р +ш +ч +д +б +з +ю +п +х +- +н +э + +ъ +й +ё +я +– +ц +м +7 +в +_ +л +о +1 +г +3 +у +ф +ь +т +2 +с diff --git a/full_models/crk-script_latin/D_100000.pth b/full_models/crk-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fbc13a2e287ca5473f06a2cf113faae6c06fb17e --- /dev/null +++ b/full_models/crk-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3956d827c324ac381289f813fcf4b17ed6cb1aa0cbb3eed6f6762a6048b9074e +size 561078639 diff --git a/full_models/crk-script_latin/G_100000.pth b/full_models/crk-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1e4968f9034db4a9e456ecc3b208663d367f399 --- /dev/null +++ b/full_models/crk-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834064c3af856b81df04465c8a38a4b26b1511bb1613207d0ce80db9d9ca195b +size 436373404 diff --git a/full_models/crk-script_latin/config.json b/full_models/crk-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crk-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crk-script_latin/vocab.txt b/full_models/crk-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9036e1a75dde584019b9ed0bdff7795ca6d53cc6 --- /dev/null +++ b/full_models/crk-script_latin/vocab.txt @@ -0,0 +1,36 @@ +m +a +c +q +— +r +y +x +e +ē +_ + +l +o +n +d +p +' +ā +k +f +w +j +- +i +ō +h +b +g +s +ī +u +v +z +t +‐ diff --git a/full_models/crk-script_syllabics/D_100000.pth b/full_models/crk-script_syllabics/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..defc07abad5fc446360ff80e70536d5af0b6036d --- /dev/null +++ b/full_models/crk-script_syllabics/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0fea206dae0d57c0784767c0e6c65410ae355174f5da291453e32c0150cf945 +size 561079247 diff --git a/full_models/crk-script_syllabics/G_100000.pth b/full_models/crk-script_syllabics/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a0d098b89c1aeddafc7d8b9fb7fedbee79821cb --- /dev/null +++ b/full_models/crk-script_syllabics/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6800e9c8351dde5716eae71b16d4a2168206d4f03c6d612c2307add3309ed194 +size 436478390 diff --git a/full_models/crk-script_syllabics/config.json b/full_models/crk-script_syllabics/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crk-script_syllabics/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crk-script_syllabics/vocab.txt b/full_models/crk-script_syllabics/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..716e2952dece7eb53d12fa447f2375c955707f1d --- /dev/null +++ b/full_models/crk-script_syllabics/vocab.txt @@ -0,0 +1,79 @@ +| +ᐧ +ᑭ +ᐃ +ᐊ +ᐁ +ᓯ +ᑲ +ᑕ +ᐦ +ᓂ +ᐢ +ᒋ +ᒥ +ᐠ +ᓇ +ᑳ +ᑯ +ᔨ +ᐅ +ᒫ +ᔭ +ᒪ +ᐤ +ᐋ +ᐣ +ᐟ +ᑫ +ᑎ +ᕽ +ᐱ +ᑖ +ᑌ +ᑐ +ᔮ +ᐸ +ᐯ +ᓈ +ᓴ +ᒧ +ᓱ +ᔦ +ᓭ +ᒣ +ᐨ +ᓀ +ᓄ +ᕒ +ᐳ +ᑦ +ᓵ +ᓬ +ᒉ +ᔪ +ᒑ +ᐹ +ᐩ +ᑊ +ᒍ +ᒐ +ᐆ +ᑰ +ᑮ +h +ᒼ +ᒨ +ᓲ +ᑑ +ᓃ +ᓅ +ᓰ +ᒦ +ᐴ +ᒌ +ᐄ +t +9 +7 + diff --git a/full_models/crn/D_100000.pth b/full_models/crn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2976f2b36ca815bd8d8ac591b08804f20c627b55 --- /dev/null +++ b/full_models/crn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc91d1e0a6fdab1e2e0a246d20dab6d67849cb61ca59901c9e4dc4369be664da +size 561076069 diff --git a/full_models/crn/G_100000.pth b/full_models/crn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0d06f6596bdeb3cac39987d791bfac7b919ccdbd --- /dev/null +++ b/full_models/crn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb8c24623e3b5c19c0af1f906467b1d2e5eac2d0a015c6aab989809a1164fea +size 436358057 diff --git a/full_models/crn/config.json b/full_models/crn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crn/vocab.txt b/full_models/crn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3ab197ca3d4ce02bc74be31a2138601bb8043977 --- /dev/null +++ b/full_models/crn/vocab.txt @@ -0,0 +1,37 @@ +a +| +' +t +u +e +i +ɨ +j +n +m +y +r +c +h +s +p +x +v +z +o +á +d +l +ú +é +í +q +b +f +g +́ +ó +ñ +k +à + diff --git a/full_models/crq/D_100000.pth b/full_models/crq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0d56495af26130dedab0d3ea98c358f4084af6b5 --- /dev/null +++ b/full_models/crq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31bdaea8bd8e1347eddad9ea9f2705bb0e6648504507c1bd8b787dff603f738b +size 561076188 diff --git a/full_models/crq/G_100000.pth b/full_models/crq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49eca7e86c2f5696a5651d5d17022d03bfa3df54 --- /dev/null +++ b/full_models/crq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f083e7eb4ddf9d716d6ab94378b38962950937c66649a4e018b3e58b948a88d +size 436380967 diff --git a/full_models/crq/config.json b/full_models/crq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crq/vocab.txt b/full_models/crq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..55090c26dcbfc5259397513d36919cfa75061347 --- /dev/null +++ b/full_models/crq/vocab.txt @@ -0,0 +1,47 @@ +é +e +q +g +ó +v +p +- +t +l +z +á +f +x +o +4 +8 +2 +j +y +3 +w +0 +– +ñ +6 +' +b +u +í +5 +s +a +ú +d +_ + +9 +n +h +c +7 +1 +k +r +m +i diff --git a/full_models/crs/D_100000.pth b/full_models/crs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9883b0d870498c0b268659270f126231c17c33b8 --- /dev/null +++ b/full_models/crs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8213d8866c349fb47a1f3573925f2e62166679d212344f26379850e3f264e80a +size 561078883 diff --git a/full_models/crs/G_100000.pth b/full_models/crs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cf75f0770e1af100f56fc23552bc3b5b6ac86e2b --- /dev/null +++ b/full_models/crs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb126b97f2ffd9c1bb5b8fa87b51cf0fd59b537bf131ca9fefc2b761679aa2f +size 436378476 diff --git a/full_models/crs/config.json b/full_models/crs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crs/vocab.txt b/full_models/crs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b24cc35103adca6da8b1829f2ecb82486752a199 --- /dev/null +++ b/full_models/crs/vocab.txt @@ -0,0 +1,36 @@ +9 +r + +z +n +l +5 +8 +d +t +2 +g +4 +y +m +h +b +s +0 +7 +w +' +f +a +p +k +v +e +o +1 +i +- +u +3 +6 +_ diff --git a/full_models/crt/D_100000.pth b/full_models/crt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..38c2f60259b8351dc9ff7737a6923a069e763c68 --- /dev/null +++ b/full_models/crt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae914fc21d7ed5ca157c3096ff0ffbdc83424206c29a2232104b4d472164d628 +size 561078632 diff --git a/full_models/crt/G_100000.pth b/full_models/crt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c6cde1287babee27dd3af327a998c730a7905899 --- /dev/null +++ b/full_models/crt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7791f93b5f544493e1eccabdca791e1bd858856c01c8297c5d87f157685afe8e +size 436382777 diff --git a/full_models/crt/config.json b/full_models/crt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/crt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/crt/vocab.txt b/full_models/crt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7e05c8474d4ae3a755a278316b949cf02c2bae59 --- /dev/null +++ b/full_models/crt/vocab.txt @@ -0,0 +1,40 @@ +l +í +t +w +ú +- +c +r +q +9 +g +4 +m +s +á + +k +— +ñ +x +p +b +y +a +e +_ +o +' +f +ó +z +d +0 +j +h +u +v +n +é +i diff --git a/full_models/csk/D_100000.pth b/full_models/csk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f87de96e1a540040663644fab5c4f27e974a1380 --- /dev/null +++ b/full_models/csk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e98b7c2cf4d3d12b40ac01b2fa4f571d10b6347689be71e800e89ad4a224e24 +size 561078837 diff --git a/full_models/csk/G_100000.pth b/full_models/csk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b7ee222af39f724ae444b3d5916000d18c6c70e0 --- /dev/null +++ b/full_models/csk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b339cc010a13821fe6772dfd68ff48568f8ecc0d4d2f8c9a2b62591a71f1618 +size 436371759 diff --git a/full_models/csk/config.json b/full_models/csk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/csk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/csk/vocab.txt b/full_models/csk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1869defd9a4dd9e25a7d3aff64ca2611446887f3 --- /dev/null +++ b/full_models/csk/vocab.txt @@ -0,0 +1,34 @@ +| +a +u +l +i +o +k +n +e +m +b +t +y +w +j +h +s +f +á +ú +ŋ +ñ +é +̥ +í +g +ó +ˈ +c +d +— +' +- + diff --git a/full_models/cso/D_100000.pth b/full_models/cso/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d27951edc83e80f58c3c9a456fe9afda471b7522 --- /dev/null +++ b/full_models/cso/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b33d3ed4effbc9f81583250d7fc48a6f04d8e1be7378f0747d2db65abf3be3 +size 561076198 diff --git a/full_models/cso/G_100000.pth b/full_models/cso/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..223ffd416d20d2433eb71a1a9e2f611a8c88774c --- /dev/null +++ b/full_models/cso/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73161a57f20cad4ef0237f2aaf9cdd6cb293ad8b3fc9a02ae5b9ce298a9b0f75 +size 436362711 diff --git a/full_models/cso/config.json b/full_models/cso/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cso/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cso/vocab.txt b/full_models/cso/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..445e96c3767b5a797a0785eaa7df7e54b879fae5 --- /dev/null +++ b/full_models/cso/vocab.txt @@ -0,0 +1,39 @@ + +í +y +ë +g +e +f +d +é +a +v +k +ñ +j +m +o +h +ɨ +3 +́ +ó +2 +ú +z +c +t +_ +l +q +n +1 +x +b +i +s +u +p +r +á diff --git a/full_models/ctd/D_100000.pth b/full_models/ctd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ff9ff7607e9c820b1f1f85e0dea0476fe887905 --- /dev/null +++ b/full_models/ctd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c24be982658f99d51097f11d02a4be31794c89b91eaf6086c7cdc29c26b19d4 +size 561078763 diff --git a/full_models/ctd/G_100000.pth b/full_models/ctd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d38fe322aa9c6251280c1c46cd4a23af8dba17b3 --- /dev/null +++ b/full_models/ctd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55c35f466092d88a700b787a28ae4c3f29de1b1162f1431881be8888b6d2034 +size 436361397 diff --git a/full_models/ctd/config.json b/full_models/ctd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ctd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ctd/vocab.txt b/full_models/ctd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d3a50077babc1cb1aa588b8d9a35c5240521199f --- /dev/null +++ b/full_models/ctd/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +n +h +t +u +g +e +k +m +p +l +o +s +w +d +c +z +b +- +v +j +r +f +y +' +x +q + diff --git a/full_models/ctg/D_100000.pth b/full_models/ctg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5e10df1612a4230cc84b80fc1552595dc452bf10 --- /dev/null +++ b/full_models/ctg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1794f1f356a8118e35516a524bd569d66ccd6ad5bdfc1bf2d426f6c52f22722c +size 561078968 diff --git a/full_models/ctg/G_100000.pth b/full_models/ctg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f8814fb3984b49acc81733167310f5dbde5c4e11 --- /dev/null +++ b/full_models/ctg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78a55797b9d6d3c071527b861a1c553b39219ba2946a15aa377c026f67a7e07 +size 436432614 diff --git a/full_models/ctg/config.json b/full_models/ctg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ctg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ctg/vocab.txt b/full_models/ctg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d7a890fce690aa1f8b7a723f36afd1050a542ca5 --- /dev/null +++ b/full_models/ctg/vocab.txt @@ -0,0 +1,60 @@ +ত +খ +ী +অ +_ +এ +ও +ঃ +ষ +— +ড +ূ +উ +গ +ে +ই + +ফ +ভ +' +ঞ +চ +ং +ঢ +ব +দ +হ +ন +য +– +ৈ +ু +থ +স +ঠ +ৌ +ট +জ +় +ি +ঐ +ল +ঝ +ঘ +ঊ +ঁ +আ +ো +া +ক +‍ +ছ +ম +প +শ +্ +ধ +- +ৃ +র diff --git a/full_models/cto/D_100000.pth b/full_models/cto/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66c0806181f3ffeca9d937b50092262005603195 --- /dev/null +++ b/full_models/cto/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f6aae30502e51bcf481f9787f4b627bf51a729bd96986b93be117c4f683517 +size 561076162 diff --git a/full_models/cto/G_100000.pth b/full_models/cto/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3b28974be23853346cbd968a42a80e02394eb43 --- /dev/null +++ b/full_models/cto/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a93da27ad2a054bcf9d6b858e8ed154c78b1525d1a2eaeb434ddd64eb4aad7d +size 436369227 diff --git a/full_models/cto/config.json b/full_models/cto/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/cto/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cto/vocab.txt b/full_models/cto/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a9d8378040ef230403a171d2f469be8d7f968687 --- /dev/null +++ b/full_models/cto/vocab.txt @@ -0,0 +1,42 @@ +a +| +r +b +e +' +i +ã +ʉ +m +d +u +w +z +t +s +k +n +o +ũ +j +ẽ +h +ĩ +̃ +p +y +g +c +ú +õ +l +ñ +í +é +f +ó +á +v +- +q + diff --git a/full_models/ctu/D_100000.pth b/full_models/ctu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8e553e521929702d863cda2dd3c6f0f9d20f7f3b --- /dev/null +++ b/full_models/ctu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c9d65d963f4a87b306d1a3c44ab54a17508c65870c5dffc44754e28e4ee4ec +size 561076204 diff --git a/full_models/ctu/G_100000.pth b/full_models/ctu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..37be97e200e55e89d8d81676e85cacff2b2a0aa5 --- /dev/null +++ b/full_models/ctu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3602b9da1d2d75430076450b4544252e49f0580a15c39bff0e7131f6188dbe3 +size 436358173 diff --git a/full_models/ctu/config.json b/full_models/ctu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ctu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ctu/vocab.txt b/full_models/ctu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9d2c49dc883de3a23d5093e00c682e788c4bdc3a --- /dev/null +++ b/full_models/ctu/vocab.txt @@ -0,0 +1,37 @@ +| +i +a +c +l +t +e +o +j +n +b +' +m +u +s +ʌ +h +y +ñ +p +w +q +x +r +d +ú +g +í +á +é +ó +f +z +v +ń +k + diff --git a/full_models/cuc/D_100000.pth b/full_models/cuc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7316ad2368ef8ce6edf2cd742461e3b60b55710f --- /dev/null +++ b/full_models/cuc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bffa0813ee875aa4bc6c2fb08da4d8081c23471da423f7ebb329505d1e10f8c +size 561078594 diff --git a/full_models/cuc/G_100000.pth b/full_models/cuc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4b890c40ce8dbc9cb5dea200983b41b9fab9c04d --- /dev/null +++ b/full_models/cuc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8eb0e6cd72f099c0ce64b9eb59e79e863181a05cfe1f5fd47e931b67b7b8888 +size 436382928 diff --git a/full_models/cuc/config.json b/full_models/cuc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cuc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cuc/vocab.txt b/full_models/cuc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2f87826e4c4aed7b0b4716477ffa1534d1dbf386 --- /dev/null +++ b/full_models/cuc/vocab.txt @@ -0,0 +1,40 @@ +| +3 +i +a +4 +n +h +2 +e +j +o +u +l +c +t +1 +s +m +ˉ +q +g +5 +ú +r +y +d +p +ñ +ŋ +b +í +á +f +é +ó +v +z +x +k + diff --git a/full_models/cui/D_100000.pth b/full_models/cui/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe8f07261bdf043bf3fe8d92734bc26fd7257ade --- /dev/null +++ b/full_models/cui/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7cd4d2ee6635be22020ebc331f4b3d9137e905b29492b8768bc0fb0e4473c7 +size 561076191 diff --git a/full_models/cui/G_100000.pth b/full_models/cui/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e0c049d2d046328de1823b18221fa90f8cff5122 --- /dev/null +++ b/full_models/cui/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca2511604aadae84a809b0b65398519ea6ab1c5c9f184991a96124b4af55ee23 +size 436360120 diff --git a/full_models/cui/config.json b/full_models/cui/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cui/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cui/vocab.txt b/full_models/cui/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..275d4884f345cec465b4169b7b4f6eb40a1e15a4 --- /dev/null +++ b/full_models/cui/vocab.txt @@ -0,0 +1,38 @@ +a +é +ñ +e +i +u +z +í +j +r +w +o +' +n +s +— +f +y +t +c +ʉ + +d +l +ú +h +q +- +b +x +_ +ó +v +p +á +m +k +g diff --git a/full_models/cuk/D_100000.pth b/full_models/cuk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5f6430ba48450fb7fe98b58b9b2194465492784f --- /dev/null +++ b/full_models/cuk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6ad59e6ac44a4ab98d5f65004726ce1b4d078be1f6fd7885857dcbbc0bc3df +size 561078741 diff --git a/full_models/cuk/G_100000.pth b/full_models/cuk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8f04a29842a31639b7965524404b347eb44aefc8 --- /dev/null +++ b/full_models/cuk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f7e3bbf38f14878d2b24f1216d368d31db954f32611bda9bc068da8bc4456c +size 436375095 diff --git a/full_models/cuk/config.json b/full_models/cuk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cuk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cuk/vocab.txt b/full_models/cuk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9adf6cfdc442aa9e48ca9af719cbe590d8ec3b37 --- /dev/null +++ b/full_models/cuk/vocab.txt @@ -0,0 +1,36 @@ +a +| +e +d +i +g +n +b +m +- +u +r +s +o +l +k +w +y +t +j +c +p +ú +h +é +— +f +í +ó +v +á +z +q +x +' + diff --git a/full_models/cul/D_100000.pth b/full_models/cul/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..84cd21e11a19846ea7e8bcb310db6380f21a86bf --- /dev/null +++ b/full_models/cul/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422a8baccd8038d4cd3b05b2d1fff5a9200873cece7f271d5e06409b4dbd63ea +size 561076170 diff --git a/full_models/cul/G_100000.pth b/full_models/cul/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b77ab318dfc2720d414c92d77d8e02fc71089633 --- /dev/null +++ b/full_models/cul/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:717c2d57f83b681d0103069e2a92548cffdb9e73271fdb6ce5a3fca10c34c1e9 +size 436367306 diff --git a/full_models/cul/config.json b/full_models/cul/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cul/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cul/vocab.txt b/full_models/cul/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..110d3dcd92bc40e6d64492a1391e9432156340ce --- /dev/null +++ b/full_models/cul/vocab.txt @@ -0,0 +1,41 @@ +' +ʼ +k +n +ñ +f +m +7 +l +o +g +— +1 +6 +9 +s +p +5 +_ +b +ó +i +- +2 +a +3 +j +e +z +v +r +c +4 +0 + +q +t +8 +h +u +d diff --git a/full_models/cwa/D_100000.pth b/full_models/cwa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1106c803f33e3cfaf81075bfa3995b948a66bd8e --- /dev/null +++ b/full_models/cwa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:323fbf177132978565be26d15a63f35f5efa9d4cdf197ad750c9847110ef6d48 +size 561078872 diff --git a/full_models/cwa/G_100000.pth b/full_models/cwa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2bbea505477c7ad51da3b327773d55555925c77 --- /dev/null +++ b/full_models/cwa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b1579f77363305e0db6c280f2b739464e4664761a87975c65ed940449a9fc9 +size 436357826 diff --git a/full_models/cwa/config.json b/full_models/cwa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cwa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cwa/vocab.txt b/full_models/cwa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..69a759c17dd70cd82523d1a20314ff16dc9db4c1 --- /dev/null +++ b/full_models/cwa/vocab.txt @@ -0,0 +1,28 @@ +n +s +k +u +t +b +f +v +i +d +p +_ +e +a +- +r +y +w +g +ú +m +j +c + +h +' +o +ʼ diff --git a/full_models/cwe/D_100000.pth b/full_models/cwe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f951dceb89303d961a76b0477db31bf45233258d --- /dev/null +++ b/full_models/cwe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414cbb9f41ea23225c5c8dd053729639c209dd6874e266d6371413d6171dcf2b +size 561079393 diff --git a/full_models/cwe/G_100000.pth b/full_models/cwe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5d5e26d964c7330b0bc38beecd0a0c5b1eec2da7 --- /dev/null +++ b/full_models/cwe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc5b83b06e937463e2bb5aba41d323be9d3ccfdb4a9cf58efca7caf3c3699ea +size 436366151 diff --git a/full_models/cwe/config.json b/full_models/cwe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cwe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cwe/vocab.txt b/full_models/cwe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..34970450d5a0cd5c9a2072d1d93a3bdbaf437cd6 --- /dev/null +++ b/full_models/cwe/vocab.txt @@ -0,0 +1,31 @@ +2 +o + +f +s +a +j +u +- +h +3 +b +y +l +c +g +7 +e +' +m +v +k +0 +p +t +w +z +_ +i +n +d diff --git a/full_models/cwt/D_100000.pth b/full_models/cwt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d60773afc3c2d8ed0c3b424ddb7cc8b9971061f --- /dev/null +++ b/full_models/cwt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49da63cb66e292cebec989f98f7c4e9465b032bfc4f438170db8f550cbdae567 +size 561078732 diff --git a/full_models/cwt/G_100000.pth b/full_models/cwt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f5e8a00bfcb40faf4fc57258b800772869bf52cb --- /dev/null +++ b/full_models/cwt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377dd1da6eb52f59b439f0465a7e84dc2f82428cb08c5efb780caaf9c7845feb +size 436368973 diff --git a/full_models/cwt/config.json b/full_models/cwt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cwt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cwt/vocab.txt b/full_models/cwt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d2731a808e867301da4b2b1123869bb0cceef5d6 --- /dev/null +++ b/full_models/cwt/vocab.txt @@ -0,0 +1,33 @@ +| +a +e +i +n +u +k +o +t +b +r +m +h +y +s +' +ŋ +j +f +á +w +l +d +ñ +ú +í +é +- +g +̱ +p +ó + diff --git a/full_models/cya/D_100000.pth b/full_models/cya/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d5b4667ac99f2b0af3043613d95745030a8920f --- /dev/null +++ b/full_models/cya/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d32f9a6c689c1c57be2e0fe45db9b8765f16cd9e04dc226e2acb0a4f39c12e5 +size 561078366 diff --git a/full_models/cya/G_100000.pth b/full_models/cya/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8032eb657ec952572ccd5560cb60417ed786b792 --- /dev/null +++ b/full_models/cya/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a76c0d4ea5b85ab8c825ac0b241eabc044fbab4168b7a49b0c9710f0e0ff9af3 +size 436376027 diff --git a/full_models/cya/config.json b/full_models/cya/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cya/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cya/vocab.txt b/full_models/cya/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2fceebd3db72f89679a50cd9dbf339d17429322d --- /dev/null +++ b/full_models/cya/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +' +u +i +c +o +t +y +s +e +h +l +ñ +d +m +j +x +g +q +r +b +p +ú +— +í +é +f +v +ó +z +á +ü +k +- + diff --git a/full_models/cym/D_100000.pth b/full_models/cym/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2bb04259228e49dd2e69597ceb080786b106bba --- /dev/null +++ b/full_models/cym/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86071ea8e0aa5864631e02fe273eb1a47a91b64a0ab86fe31c110e4154256b86 +size 561110513 diff --git a/full_models/cym/G_100000.pth b/full_models/cym/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..25e8e87f19f5bfe877633e82b9661f2f6cbefdc2 --- /dev/null +++ b/full_models/cym/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2c652b72c2712e336fffd4a2b65881f2cfbcf503959cbb88f72788389fa611 +size 436624818 diff --git a/full_models/cym/config.json b/full_models/cym/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/cym/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/cym/vocab.txt b/full_models/cym/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..3fc8f1ca78eaabcec0a5f28bdd036ef32a417e54 --- /dev/null +++ b/full_models/cym/vocab.txt @@ -0,0 +1,40 @@ +n +d +ŷ +î +x +— +h +o +_ +s +ó + +u +- +r +' +g +a +ŵ +f +y +m +â +e +b +j +z +p +û +i +ï +l +c +ô +ö +ë +ê +w +á +t diff --git a/full_models/daa/D_100000.pth b/full_models/daa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d0a10cb61b0951265c7f9f5fb9d4418081c1ca53 --- /dev/null +++ b/full_models/daa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf11548d5f947761e855c456591bb9c9fb7c559fbd88ca8220b153cdf566cd6c +size 561078575 diff --git a/full_models/daa/G_100000.pth b/full_models/daa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..de3168a6df5a850d5ceae27c8c7e1ff1dc22354d --- /dev/null +++ b/full_models/daa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfeb84b35db3dea3a73a6fc38872f15fb2d05ff9a6c642e47be346a7957011c5 +size 436362085 diff --git a/full_models/daa/config.json b/full_models/daa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/daa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/daa/vocab.txt b/full_models/daa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2093ddcde86898c15649b68f2f56b845670d588d --- /dev/null +++ b/full_models/daa/vocab.txt @@ -0,0 +1,31 @@ +| +a +i +k +n +o +u +e +r +t +g +ŋ +y +m +s +b +l +d +ɗ +w +c +- +p +̰ +j +h +z +ɓ +ƴ +' + diff --git a/full_models/dah/D_100000.pth b/full_models/dah/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..54c7d0f100bec6fb542fd5a9d746cf4ee22263ff --- /dev/null +++ b/full_models/dah/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c864c64df378599f601131ec9974cda4e8186b04d08d30babcda28bb0b29474 +size 561078610 diff --git a/full_models/dah/G_100000.pth b/full_models/dah/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59544c4789aac901474ec81dbe2d4fb6d9c0b876 --- /dev/null +++ b/full_models/dah/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e00466e16c0ae8496b5715a6dead0f5d29472dc6aba507818b17a639b183f58 +size 436373462 diff --git a/full_models/dah/config.json b/full_models/dah/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dah/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dah/vocab.txt b/full_models/dah/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c9f0573cbe5ffecfe775acb2bbefe1dcdb4cba60 --- /dev/null +++ b/full_models/dah/vocab.txt @@ -0,0 +1,36 @@ +e +h +– +g +w +k +5 +8 +- +4 +' +6 +t +1 +m +0 +f +i +2 +u +_ +s +b +7 +y +n +d +p + +a +3 +9 +ŋ +o +l +r diff --git a/full_models/dar/D_100000.pth b/full_models/dar/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3606c8f7d8707c3196325949d8e29d8c825f00f --- /dev/null +++ b/full_models/dar/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7684d7dc9c68d38823c46730e85a0dbea44e151ec3e75d3a73df8b0130526b83 +size 561076028 diff --git a/full_models/dar/G_100000.pth b/full_models/dar/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dc95c8bdddc498f00945681dc74391a4c7b865a6 --- /dev/null +++ b/full_models/dar/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a81397a04f705cc24c0ddee70d2a409c690cd20786d5d918e7144dbe539d6393 +size 436354764 diff --git a/full_models/dar/config.json b/full_models/dar/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dar/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dar/vocab.txt b/full_models/dar/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b282c617d92350064a1560c20590e15d1e0c6ee9 --- /dev/null +++ b/full_models/dar/vocab.txt @@ -0,0 +1,36 @@ +ь +п +_ +б +о +ш +– +ф +м +р +ж +а +' + +н +к +ю +я +- +ъ +х +й +ч +с +г +л +з +ӏ +у +т +э +и +ц +в +е +д diff --git a/full_models/dbj/D_100000.pth b/full_models/dbj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb691f8908887f06fc574fa56b0f59c233979896 --- /dev/null +++ b/full_models/dbj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f8bb66480343ec95c3b987407cff5667cec3a2d8308f7291b48a6d5728c9bf +size 561076147 diff --git a/full_models/dbj/G_100000.pth b/full_models/dbj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..beb258954a9b9239d6d29e7206c72422c8f7ac82 --- /dev/null +++ b/full_models/dbj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09e7ca3f542839f32d832333148c95a615f8ce25f29ecbe9214f77d13abeb8f +size 436334396 diff --git a/full_models/dbj/config.json b/full_models/dbj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dbj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dbj/vocab.txt b/full_models/dbj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e55d26e1c365da616c56c7544ff8f3c593630353 --- /dev/null +++ b/full_models/dbj/vocab.txt @@ -0,0 +1,27 @@ +' +b +l +y +f +c +n +o +i +_ +s +g +z +d +k +m +j +- +a + +p +u +e +t +r +h +w diff --git a/full_models/dbq/D_100000.pth b/full_models/dbq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1cb7ea73f0b92f9532eb924254ed5f7363affed1 --- /dev/null +++ b/full_models/dbq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8094a17bf24eb2e6c5c8817f7704d01cd74adbaa452c5115b7f69a38d428a3 +size 561078477 diff --git a/full_models/dbq/G_100000.pth b/full_models/dbq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0610a28a90025a8210021c42c81d173ad54c25b6 --- /dev/null +++ b/full_models/dbq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e14eb852affbd97a28bd56cbcb2b791de9ed19cc4e5b4f6b3232800d6560117 +size 436366494 diff --git a/full_models/dbq/config.json b/full_models/dbq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dbq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dbq/vocab.txt b/full_models/dbq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4b482b32beb66b499cf357c25cb648bdafdb8e65 --- /dev/null +++ b/full_models/dbq/vocab.txt @@ -0,0 +1,33 @@ +k +é +á +_ +l +o +c +r +ɓ +ɗ +a +' +s +i +j +ú +z +g +ə +h +y + +m +n +e +v +p +b +t +d +f +w +u diff --git a/full_models/ddn/D_100000.pth b/full_models/ddn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..89801d64970be44e7dee1fbfa7acca4d2a79a1d1 --- /dev/null +++ b/full_models/ddn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a938d64935b1725bcdf17fb95baebbab533a0e4a58f81dcc4fe1d1f11d3b2e6a +size 561079477 diff --git a/full_models/ddn/G_100000.pth b/full_models/ddn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a4aa7978894cb2adfeebfc88cb560ce2bd9ba2f --- /dev/null +++ b/full_models/ddn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e68f9406b9b1c5199a53ece2b1bbc45b4691fb80a2e7d533887954430fe459f +size 436380007 diff --git a/full_models/ddn/config.json b/full_models/ddn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ddn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ddn/vocab.txt b/full_models/ddn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c710a5ed3100dd8e6cbefff75c8b78941b126412 --- /dev/null +++ b/full_models/ddn/vocab.txt @@ -0,0 +1,36 @@ +g + +t +à +f +e +̀ +ɛ +ò +k +a +d +_ +z +m +w +c +h +ɑ +ŋ +ɔ +ã +n +u +̃ +b +p +l +j +á +i +r +y +o +s +ǹ diff --git a/full_models/ded/D_100000.pth b/full_models/ded/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e63a0a3f41b2d0c13ab26840d42706539179fdd --- /dev/null +++ b/full_models/ded/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d640fad48e210d4aa7d792accb78f933f4cff60917357f8c82fed4e30a76aa3a +size 561079348 diff --git a/full_models/ded/G_100000.pth b/full_models/ded/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d1630e0eaa6bdacd685abd37cde449ee00406d2 --- /dev/null +++ b/full_models/ded/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8b5731a6db13f5bafa708b919fe8b3a50ef1d4f67411357f24855015f38821 +size 436378829 diff --git a/full_models/ded/config.json b/full_models/ded/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ded/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ded/vocab.txt b/full_models/ded/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cffabb035278daa4e921a9ab56414c1a5884145c --- /dev/null +++ b/full_models/ded/vocab.txt @@ -0,0 +1,36 @@ +k +8 +n +2 +5 +e +f +w +a +r +u +1 +_ +c +0 +h +b +3 +o +9 +i +g +d +' +6 +m +— +y +p +z +t +s +l +4 +7 + diff --git a/full_models/des/D_100000.pth b/full_models/des/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..26c7cdf1d786d7fbea8d17d5af3151306eb4ed9a --- /dev/null +++ b/full_models/des/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81713d7b5c7b91025dce8216a220f4dc5dcd281d9b2a2fd2392e3a52881b2f25 +size 561078707 diff --git a/full_models/des/G_100000.pth b/full_models/des/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf188f3a286b87e847d8828e9a35ba4dd08fb117 --- /dev/null +++ b/full_models/des/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1b659574d623285f6f931e140be901bc3d3c9fb5ef229fe09ffed90f883f7f +size 436396618 diff --git a/full_models/des/config.json b/full_models/des/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/des/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/des/vocab.txt b/full_models/des/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d02ba53f1e672c3d3dde1a913d864260b87d93bc --- /dev/null +++ b/full_models/des/vocab.txt @@ -0,0 +1,46 @@ +| +r +a +e +i +ʉ +o +m +g +ã +u +p +ĩ +h +s +c +b +j +d +t +y +w +n +á +ñ +̃ +õ +q +ẽ +l +ũ +ó +í +é +f +v +ü +z +1 +ú +- +k +x +‐ +̱ + diff --git a/full_models/deu/D_100000.pth b/full_models/deu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..776b99cfad6ad65b942197a5ff02b54315e2b3eb --- /dev/null +++ b/full_models/deu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6affdd35744b4e887d5e6adaf976e559941f4abe43af429d7def43fe0bfae7b8 +size 561110506 diff --git a/full_models/deu/G_100000.pth b/full_models/deu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dcf614b5ada6d7a42203898fb98dc2d94c0443f1 --- /dev/null +++ b/full_models/deu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582ee558bef5498ef42e15e4930161ac016d2b3a37463eec250fca987a4c3a36 +size 436635092 diff --git a/full_models/deu/config.json b/full_models/deu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/deu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/deu/vocab.txt b/full_models/deu/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..fa431b6edba85e373134936bde1085c8a8305a77 --- /dev/null +++ b/full_models/deu/vocab.txt @@ -0,0 +1,45 @@ + +v +2 +q +g +- +f +1 +8 +a +h +4 +ö +3 +r +m +ä +l +n +t +ë +d +b +y +ß +o +u +_ +j +s +6 +5 +ï +c +i +ü +p +k +e +– +w +z +7 +x +0 diff --git a/full_models/dga/D_100000.pth b/full_models/dga/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c115ac0e9fdbfd571531938ecbe8c482622142b7 --- /dev/null +++ b/full_models/dga/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05246082f540538667532e4cad95af7a951f34d23ca57111bd72586f8c3c8e9e +size 561079002 diff --git a/full_models/dga/G_100000.pth b/full_models/dga/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3da00adefa0b283fdb3f5dc76cb8e01b4b331dcf --- /dev/null +++ b/full_models/dga/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c0b52e83dc7295b04da0c517045d44578effd4f20c1c5893669070f718c60f +size 436374747 diff --git a/full_models/dga/config.json b/full_models/dga/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dga/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dga/vocab.txt b/full_models/dga/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..964806cc9e691c46196b4830e4d50794bee8ae05 --- /dev/null +++ b/full_models/dga/vocab.txt @@ -0,0 +1,35 @@ +f +w +t +õ +ŋ +l +ɛ +' +g +o +v +k +d +n +ã +u +̃ +i +ɔ +e +z +h +p +y +ẽ +ĩ +b +_ +- +s +m +ũ + +r +a diff --git a/full_models/dgi/D_100000.pth b/full_models/dgi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..862fd9802ab6508e8e91735785c7315a7b001017 --- /dev/null +++ b/full_models/dgi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:229076a3cfc689f5f7bfd1c6fcb244d5c895feb6a0b7e0f990a49f33b9c495ea +size 561078887 diff --git a/full_models/dgi/G_100000.pth b/full_models/dgi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b74d5ead1162945ede586f3192a2c80a3e047338 --- /dev/null +++ b/full_models/dgi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f117a9bf57f975344e5c491013c8210e360344f06ccea8f754750c6298ef0c85 +size 436416481 diff --git a/full_models/dgi/config.json b/full_models/dgi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dgi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dgi/vocab.txt b/full_models/dgi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e0117e7f5893989b60b52ef1f8209f3a714abeaa --- /dev/null +++ b/full_models/dgi/vocab.txt @@ -0,0 +1,53 @@ +| +a +ɩ +n +ɛ +b +ʋ +r +t +l +e +w +m +y +ɔ +k +̃ +- +i +s +z +ã +p +u +o +d +ŋ +ƴ +' +f +c +́ +v +̀ +g +õ +ẽ +ũ +á +ú +ù +à +í +ɓ +h +j +é +ĩ +ì +ó +ò +è + diff --git a/full_models/dgk/D_100000.pth b/full_models/dgk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa6ef41cbac1e4dea5dc03641be363e7ecddbaa6 --- /dev/null +++ b/full_models/dgk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64edc751ca1680267dd08c9f7bfdcc90996088e68cfdfe8a25deefe0c3d658fd +size 561079218 diff --git a/full_models/dgk/G_100000.pth b/full_models/dgk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02cd7c2eaa61c15ee6c587eda100f213f36c7399 --- /dev/null +++ b/full_models/dgk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6cd9d307144932fd4e17973b26acd18623be288e7c43f44a62d053ee5de73e +size 436401660 diff --git a/full_models/dgk/config.json b/full_models/dgk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dgk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dgk/vocab.txt b/full_models/dgk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0895e12a58f9797444196a0e21f2ee8e6f271dbe --- /dev/null +++ b/full_models/dgk/vocab.txt @@ -0,0 +1,46 @@ +é +a +ә +u +ù +ḭ +g +r +d +̰ +t +j +m +p +h +ò +ì +í +ɔ +n +l +á +_ +ɓ +w +ú +ó +ɗ +' +́ + +ə +i +2 +k +s +- +ṵ +à +o +̀ +ŋ +y +b +ɛ +e diff --git a/full_models/dgo/D_100000.pth b/full_models/dgo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0afaac54bba51fe928ec621cc9b1d2e027b97371 --- /dev/null +++ b/full_models/dgo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f36539e325c0f888306d6fc2b1a30f229a8e7e85194a7bc8e484d714383cc8 +size 561079121 diff --git a/full_models/dgo/G_100000.pth b/full_models/dgo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..72d9fa81de8320cda371019ba66452443619d5e8 --- /dev/null +++ b/full_models/dgo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5cf794a3814294efe75f9a094598d1a01745b79ececc75d87cccff0f19fa38 +size 436442709 diff --git a/full_models/dgo/config.json b/full_models/dgo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dgo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dgo/vocab.txt b/full_models/dgo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f7f258aec288dbd80011af3b44e30f1a011cd3b0 --- /dev/null +++ b/full_models/dgo/vocab.txt @@ -0,0 +1,64 @@ +| +े +ा +न +र +क +द +ी +त +स +ं +् +ल +प +म +ि +य +ग +ज +ै +ु +ब +च +ओ +आ +ो +ई +ड +ख +उ +़ +ऐ +अ +ए +श +व +ह +थ +ू +ट +ऊ +छ +ँ +फ +ौ +इ +भ +ध +ठ +- +झ +ढ +ष +ण +औ +घ +ञ +ृ +ः +' +ॉ +‍ +4 + diff --git a/full_models/dgr/D_100000.pth b/full_models/dgr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c491bf49547132e376c762cad3e8e96719b0c58a --- /dev/null +++ b/full_models/dgr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd75a93722974a279a1672b4507bfeaba5ed4351712a22ea9102332131c5717 +size 561078578 diff --git a/full_models/dgr/G_100000.pth b/full_models/dgr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..222d29faf644c97ff828a35407e12a2377c6572c --- /dev/null +++ b/full_models/dgr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515eff88a8dd220373940b45c5eaa878462bfc82024390defa04363c5958c5a2 +size 436391870 diff --git a/full_models/dgr/config.json b/full_models/dgr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dgr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dgr/vocab.txt b/full_models/dgr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2100844c53b1282d9b87c592ef87cf286e8ad670 --- /dev/null +++ b/full_models/dgr/vocab.txt @@ -0,0 +1,44 @@ +g +- +q +v + +f +e +y +d +ì +ʔ +s +ɂ +ǫ +z +r +a +' +ę +w +o +ò +x +̨ +m +b +l +ą +h +p +n +į +k +è +c +u +ı +ł +̀ +_ +à +t +i +j diff --git a/full_models/dhi/D_100000.pth b/full_models/dhi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..537880fc56f346ef1a0a3dcfdc31629badb98d5e --- /dev/null +++ b/full_models/dhi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739f6a431d2d798a2ae99d9d67add74eb640fad7d0e6fc83d0c8fa059034da12 +size 561078884 diff --git a/full_models/dhi/G_100000.pth b/full_models/dhi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9de04733e4d7912324686548f52503b0dc6e33d2 --- /dev/null +++ b/full_models/dhi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f6de94f0a030e4c969f6d386a62fb32ee27821f98768f61294b35258b121e6 +size 436423330 diff --git a/full_models/dhi/config.json b/full_models/dhi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dhi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dhi/vocab.txt b/full_models/dhi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5b536657890e4fb3be1a964a63fd91142f1b1fed --- /dev/null +++ b/full_models/dhi/vocab.txt @@ -0,0 +1,56 @@ +ा +| +ि +क +े +् +ल +ो +ङ +ह +इ +स +न +र +त +प +ु +म +द +ब +य +ग +उ +व +ख +ज +अ +भ +आ +च +थ +ध +घ +‍ +ए +फ +ओ +ट +झ +- +ड +छ +ै +ठ +ँ +ढ +ौ +ृ +' +औ +ऐ +ण +श +़ +ं + diff --git a/full_models/did/D_100000.pth b/full_models/did/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f5c53b995f6333a6e99533d4e19189ab6c76f319 --- /dev/null +++ b/full_models/did/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e219da60f87733e72509982d2f9e985b5d66766de26a80a4c7926a893fad4c30 +size 561078745 diff --git a/full_models/did/G_100000.pth b/full_models/did/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..013b33cda647b59c0ab246ad9ed3ff62dae724c3 --- /dev/null +++ b/full_models/did/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e7ddc9ee3002677a8f468fc00dd7f2c5c6c6231c272aae6b9115bd127fb094 +size 436373864 diff --git a/full_models/did/config.json b/full_models/did/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/did/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/did/vocab.txt b/full_models/did/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bc193506e9cdfce726100fe6c5a9e6b8d6fc12e4 --- /dev/null +++ b/full_models/did/vocab.txt @@ -0,0 +1,35 @@ +i +v +- +ĩ +a + +ũ +d +ꞌ +c +1 +õ +e +k +s +6 +r +w +m +g +t +b +o +u +_ +ẽ +h +á +n +p +j +' +l +y +ú diff --git a/full_models/dig/D_100000.pth b/full_models/dig/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d0e25eda1adf2db3e54c546e77acc8f46e5ba2b2 --- /dev/null +++ b/full_models/dig/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88f26b8070bbf924ad8bf4b7a0ac1b818dd22a1da170b9b269131f795e3152a +size 561078872 diff --git a/full_models/dig/G_100000.pth b/full_models/dig/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91c980807eda74ac3a61684867a2ffe06edf7a35 --- /dev/null +++ b/full_models/dig/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:535c8d5c243c62746baf1d8927e746fa51c644d6e2ff9d90e9284241ebb629c5 +size 436367462 diff --git a/full_models/dig/config.json b/full_models/dig/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dig/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dig/vocab.txt b/full_models/dig/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4ba14c0bbd0e4bc71ab04d58cd3d365f209b5321 --- /dev/null +++ b/full_models/dig/vocab.txt @@ -0,0 +1,32 @@ +c +' +l +a +v +á +o +r +u +k +m +5 +d +ó +n +0 +j + +p +f +y +s +i +e +t +b +w +_ +g +- +z +h diff --git a/full_models/dik/D_100000.pth b/full_models/dik/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a9fc02b6f4e8eb2917a1e8e11ab8cc915119d51 --- /dev/null +++ b/full_models/dik/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb4ea02b6de5d1f924f4c0ea5b8e0cb0b5741693b2b2872585060ef15bb9b2f +size 561079007 diff --git a/full_models/dik/G_100000.pth b/full_models/dik/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6d3faa0025fa728c53beefb0c86fda040ef11fc5 --- /dev/null +++ b/full_models/dik/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c4ff022c3cc9b2f9fb191627fb26f015be31b82e6da6a52fb091b9cd0f79c5 +size 436369106 diff --git a/full_models/dik/config.json b/full_models/dik/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dik/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dik/vocab.txt b/full_models/dik/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..097c0c8fbc79c4a14a4f9b2334048b4a506f0ce9 --- /dev/null +++ b/full_models/dik/vocab.txt @@ -0,0 +1,33 @@ +| +k +a +n +i +c +e +u +t +ë +l +ï +ɔ +h +y +̈ +r +ɛ +o +b +m +ä +w +p +d +ŋ +ö +g +j +ɣ +' +- + diff --git a/full_models/dip/D_100000.pth b/full_models/dip/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b88b694bd8de75b5bc58ddde7c7091d60626f5e1 --- /dev/null +++ b/full_models/dip/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c5ef2fcd15d2ddb92603eaae88c2c2145e46bb29a3fafe3770586709d6430ab +size 561078741 diff --git a/full_models/dip/G_100000.pth b/full_models/dip/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ae9feecbde70c9e5ee175c802246bdea39fb38c6 --- /dev/null +++ b/full_models/dip/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9229d9d01d31a9e0a2d374efdc83bc14ffcf65bf106872980fb8e745728830b +size 436361585 diff --git a/full_models/dip/config.json b/full_models/dip/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dip/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dip/vocab.txt b/full_models/dip/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d596f19866f03f7d20a704e8dd5aa6e463f36840 --- /dev/null +++ b/full_models/dip/vocab.txt @@ -0,0 +1,29 @@ +| +e +i +k +a +n +u +t +c +ɔ +o +y +l +r +h +d +ɛ +m +b +w +p +ŋ +g +j +ɣ +ԑ +— +ı + diff --git a/full_models/div/D_100000.pth b/full_models/div/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c40d91cf95e7e3967af81f03e036e24880996f0 --- /dev/null +++ b/full_models/div/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265eedf80affbd56223a3b19690e2ba363e32d6cb07671b41e81add82724aa99 +size 561076065 diff --git a/full_models/div/G_100000.pth b/full_models/div/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e36521653a77d0cae91d90310ef76afb3fc6453 --- /dev/null +++ b/full_models/div/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c33e82680d8000579c9e20db106a2a10b9916d7c7808cc4160132677240dd7 +size 436394053 diff --git a/full_models/div/config.json b/full_models/div/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/div/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/div/vocab.txt b/full_models/div/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc4ceb10967e5d2573de2c8f950f1f7d9ec9116a --- /dev/null +++ b/full_models/div/vocab.txt @@ -0,0 +1,53 @@ +| +ަ +ެ +އ +ް +ނ +ު +ި +ާ +ކ +ވ +ގ +މ +ރ +ހ +ީ +ތ +ދ +ފ +ބ +ސ +ލ +ށ +ޭ +ޮ +ޅ +ޔ +ޑ +ޫ +ޖ +ޙ +ޕ +ޯ +ޓ +ޤ +ޒ +ޢ +ޏ +ޗ +ޚ +ޝ +ޞ +ޣ +' +ޟ +ل +ޡ +ا +ه +ޛ +ޠ +ޘ + diff --git a/full_models/djk/D_100000.pth b/full_models/djk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a4109c7527d953d33dde9d4d7f1af0729026665 --- /dev/null +++ b/full_models/djk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1879835b5c3e90e366488c3b4fecb03640a5ff822c491907ae85f4ace017653 +size 561078214 diff --git a/full_models/djk/G_100000.pth b/full_models/djk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7fabc6cb2f7cddd43bd59e3bdebcb2228ac82c15 --- /dev/null +++ b/full_models/djk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15e88b1b5c48287f0793509430bbc10b9e118b77cc9ea583ce1b5ede54d15a6 +size 436359600 diff --git a/full_models/djk/config.json b/full_models/djk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/djk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/djk/vocab.txt b/full_models/djk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d25be8558784fe9a326c68e8b0b83924997aa350 --- /dev/null +++ b/full_models/djk/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +e +n +u +o +s +d +k +t +m +f +b +g +w +l +p +y +á +j +h +v +z +0 +1 +2 +- +r + diff --git a/full_models/dnj-dialect_blowowest/D_100000.pth b/full_models/dnj-dialect_blowowest/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b7feb94dfe35fcab1ad1efbf04a2a93a2073faf --- /dev/null +++ b/full_models/dnj-dialect_blowowest/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca8111c6732fceec85aef8bbbc16a75922fefac56240ab6af99366c8502a123 +size 561078631 diff --git a/full_models/dnj-dialect_blowowest/G_100000.pth b/full_models/dnj-dialect_blowowest/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39a0f890c8d1fb170f4dcee54493e6a3560f13c7 --- /dev/null +++ b/full_models/dnj-dialect_blowowest/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c645f1c97a777e2fb5f6ae63f2bac6d66a23886344e039047c8aa1e5ec64f4ff +size 436364335 diff --git a/full_models/dnj-dialect_blowowest/config.json b/full_models/dnj-dialect_blowowest/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dnj-dialect_blowowest/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dnj-dialect_blowowest/vocab.txt b/full_models/dnj-dialect_blowowest/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24a66b64914eb67863583c26b30d4a1807f296e7 --- /dev/null +++ b/full_models/dnj-dialect_blowowest/vocab.txt @@ -0,0 +1,32 @@ +| +‐ +a +' +ö +n +h +k +ë +d +ɛ +b +u +o +y +w +g +꞊ +ɔ +i +ü +l +p +m +s +z +t +e +f +v +r + diff --git a/full_models/dnj-dialect_gweetaawueast/D_100000.pth b/full_models/dnj-dialect_gweetaawueast/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4547d888e29c08ea3849d91bc4161490d3dd8651 --- /dev/null +++ b/full_models/dnj-dialect_gweetaawueast/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e3cabac40d254794b2f96c6a21047de4bcc3e545353058058f33023e1cfadb +size 561076185 diff --git a/full_models/dnj-dialect_gweetaawueast/G_100000.pth b/full_models/dnj-dialect_gweetaawueast/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e07ba7ae79bcba2b60a46af7ac07268dca4fbd3b --- /dev/null +++ b/full_models/dnj-dialect_gweetaawueast/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54119c843d5f7be4aa3d5343a76ec53c045c29ae0314a6c3a68cf10b8b5f4719 +size 436355911 diff --git a/full_models/dnj-dialect_gweetaawueast/config.json b/full_models/dnj-dialect_gweetaawueast/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dnj-dialect_gweetaawueast/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dnj-dialect_gweetaawueast/vocab.txt b/full_models/dnj-dialect_gweetaawueast/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7be4199ff12b301ee61d8eefaa0c38c0d5ae28ea --- /dev/null +++ b/full_models/dnj-dialect_gweetaawueast/vocab.txt @@ -0,0 +1,36 @@ +| +‐ +a +' +h +n +ö +d +k +ɛ +b +y +g +ë +ɔ +w +o +i +꞊ +u +ü +m +s +p +t +ʋ +z +̈ +e +l +ɩ +f +r +v +1 + diff --git a/full_models/dnt/D_100000.pth b/full_models/dnt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ce0642a809a5f0cbdac11a4f2edeb29e018d4b2 --- /dev/null +++ b/full_models/dnt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3f65b8af2ea8eac11224c62162068664972943ce4925e1a064a87471b078aa +size 561076829 diff --git a/full_models/dnt/G_100000.pth b/full_models/dnt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..017a8d3b79665fb9b4426214615644e4c8a4221b --- /dev/null +++ b/full_models/dnt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ae2bcdded73dc458ee2aebb64480b60dda6ab996891db8cf74333c1c01049b +size 436378069 diff --git a/full_models/dnt/config.json b/full_models/dnt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dnt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dnt/vocab.txt b/full_models/dnt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7bca5cf47b072e70a79a857700e073068582f6e4 --- /dev/null +++ b/full_models/dnt/vocab.txt @@ -0,0 +1,38 @@ +| +a +e +i +k +o +n +h +g +t +l +u +m +s +r +b +w +d +y +p +' +- +f +0 +1 +7 +z +2 +4 +3 +j +5 +6 +9 +c +8 +v + diff --git a/full_models/dnw/D_100000.pth b/full_models/dnw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb668ef0cc8539a261b5ef44dd258c3c6424faee --- /dev/null +++ b/full_models/dnw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18bbfcd61bac2f629cf611ac0730dd065254f0e429a8edcfc487bc8172ce704 +size 561078632 diff --git a/full_models/dnw/G_100000.pth b/full_models/dnw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a687031d23a4c58caad4f838c0b8e45527fa75f4 --- /dev/null +++ b/full_models/dnw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a031e41b9401672d23399d0477f495293965d5f4721cadf6a4f043413ee9855 +size 436371374 diff --git a/full_models/dnw/config.json b/full_models/dnw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dnw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dnw/vocab.txt b/full_models/dnw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..54186845841745f9bfed4151ceec00a635985e57 --- /dev/null +++ b/full_models/dnw/vocab.txt @@ -0,0 +1,35 @@ +c +p +2 +0 +b +7 +l +6 +r +e +' +n +a +d +t +h +o +3 +9 +w + +_ +- +i +u +g +s +k +j +8 +4 +y +m +1 +5 diff --git a/full_models/dop/D_100000.pth b/full_models/dop/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0d8125bfbf0c30aa6abbeb13ee0b22cd37c3bba5 --- /dev/null +++ b/full_models/dop/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64df3c42f9a882a23ee5825132bcddeaf118956a8ec0da044ae2a54de69b5e81 +size 561078579 diff --git a/full_models/dop/G_100000.pth b/full_models/dop/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ea798adaa1476f3c036434f8ae774590455130fe --- /dev/null +++ b/full_models/dop/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797af295b49bf282729312b98e05df3bbf50be17ee31e6475f1976111577407f +size 436371407 diff --git a/full_models/dop/config.json b/full_models/dop/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dop/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dop/vocab.txt b/full_models/dop/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fb57ecd148e2d2d845c4ca821e84f171b02ea364 --- /dev/null +++ b/full_models/dop/vocab.txt @@ -0,0 +1,35 @@ +| +a +t +ɩ +n +ɔ +ɛ +p +l +ʋ +ə +s +k +m +ɣ +i +́ +y +e +u +w +ŋ +á +- +o +h +c +f +ḿ +ń +ú +é +í +3 + diff --git a/full_models/dos/D_100000.pth b/full_models/dos/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67ad5fccd56228c382863adae970357c7681967a --- /dev/null +++ b/full_models/dos/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e70c62ac998eeb7acb06d6771dfe03bde54fda6d3ad1e21694d70f640c0879 +size 561079132 diff --git a/full_models/dos/G_100000.pth b/full_models/dos/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..691346a271008c2a3d583bd7150164f7d509e587 --- /dev/null +++ b/full_models/dos/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6a4e30184b2d5bc124dad54804669f4257ba15e6412d71edb9cbde77314821 +size 436395627 diff --git a/full_models/dos/config.json b/full_models/dos/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dos/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dos/vocab.txt b/full_models/dos/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..83182645ba658ba7dc04fc0b4b62eb9685f5851a --- /dev/null +++ b/full_models/dos/vocab.txt @@ -0,0 +1,44 @@ +o +ɓ +v +w +ɛ +h +u +0 +à +1 +á +n + +́ +í +p +ĩ +s +ɩ +r +ʋ +k +i +ũ +ŋ +y +ɔ +ã +c +ʔ +ɗ +z +̀ +̃ +_ +m +e +a +b +d +f +g +l +t diff --git a/full_models/dsh/D_100000.pth b/full_models/dsh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e8c7787efb25aa1f6aea13362bf9be9e9743694 --- /dev/null +++ b/full_models/dsh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15482ee273c088ce592ab0dabfbaff267ab3672f4c7b17c9eee4a750ddc32109 +size 561078759 diff --git a/full_models/dsh/G_100000.pth b/full_models/dsh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5c09501e2978a20ff4947039f76bc999f674fcc8 --- /dev/null +++ b/full_models/dsh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae8a93623e75d02c71e9d50eb77a7d2885c8aca73666391b68507f2da2603862 +size 436385375 diff --git a/full_models/dsh/config.json b/full_models/dsh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dsh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dsh/vocab.txt b/full_models/dsh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..96bea12f4fa2d0a2b40aace6180b6007e533057c --- /dev/null +++ b/full_models/dsh/vocab.txt @@ -0,0 +1,40 @@ +k + +̶ +ó +ô +j +- +b +u +ʼ +_ +t +ˈ +o +r +w +â +l +đ +a +é +m +ê +v +' +î +h +f +á +ú +n +e +i +c +í +û +d +g +s +y diff --git a/full_models/dso/D_100000.pth b/full_models/dso/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f7d168b054ecab453f4bc20af825766b00362115 --- /dev/null +++ b/full_models/dso/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f9e7c958ce1915bba5fc43ade9e15dced53056c14f2b928b0d15279f252cbf +size 561076025 diff --git a/full_models/dso/G_100000.pth b/full_models/dso/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9ecd14899bbec5cfd1d2758c192fa76fdaa29a65 --- /dev/null +++ b/full_models/dso/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a6441febceaf63f10240fb4bab066dc4391095aad55eed64380355fa2e6b01 +size 436347473 diff --git a/full_models/dso/config.json b/full_models/dso/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dso/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dso/vocab.txt b/full_models/dso/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..94513f03b6f4912aff4f02c7633beccd44d0ed3b --- /dev/null +++ b/full_models/dso/vocab.txt @@ -0,0 +1,33 @@ +୍ +ଡ +ପ +ଙ +ର +ଇ +ଅ +_ +ବ +ଲ +ଚ +ଁ +ଉ +ସ +ା +ନ +ଦ +ୟ +ଣ +ଗ +େ +ଆ + +ଜ +ଟ +‍ +ମ +ୁ +ି +ଏ +ଞ +କ +ତ diff --git a/full_models/dtp/D_100000.pth b/full_models/dtp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdc7c31dbab9adc7bce55d2a3ccda8c52995a108 --- /dev/null +++ b/full_models/dtp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a18f5e8fc80d0e6e72b24f73c3795512d0686bd7ce7c1a991ed16cc0a1e30f +size 561078603 diff --git a/full_models/dtp/G_100000.pth b/full_models/dtp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..de6a36bceab17d369a1eba273d81ade92640f185 --- /dev/null +++ b/full_models/dtp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07928b30836ae343bfddc0aba67f0f305ff43f66026c0a8a40d6ea2af70b963d +size 436364490 diff --git a/full_models/dtp/config.json b/full_models/dtp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dtp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dtp/vocab.txt b/full_models/dtp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..73443258e9e61f0ebc077e5409e03e78ee4fd6e4 --- /dev/null +++ b/full_models/dtp/vocab.txt @@ -0,0 +1,32 @@ +| +o +i +a +n +d +u +t +k +m +' +s +g +p +r +l +y +h +b +w +- +e +j +— +0 +4 +c +1 +6 +2 +3 + diff --git a/full_models/dts/D_100000.pth b/full_models/dts/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4b988efa6db42f81614565901ae75861544a3ee6 --- /dev/null +++ b/full_models/dts/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6208e006d64934f6e693c2978130456795b501ca9b7aee35f747097f2f9044e +size 561078857 diff --git a/full_models/dts/G_100000.pth b/full_models/dts/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c1845792110895b1bf893a4b75519c45b6b510c1 --- /dev/null +++ b/full_models/dts/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5779b3a53094bcd8abe3283df2c83f8ebd5091919be3e96024fdd901c262113b +size 436356844 diff --git a/full_models/dts/config.json b/full_models/dts/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dts/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dts/vocab.txt b/full_models/dts/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86f2e9cb2f9554afab02bb76d1be4ac8631849d1 --- /dev/null +++ b/full_models/dts/vocab.txt @@ -0,0 +1,28 @@ +| +a +i +ɛ +n +u +ɔ +e +g +b +w +o +m +r +l +y +k +s +d +j +t +p +ŋ +ɲ +h +' +- + diff --git a/full_models/dug/D_100000.pth b/full_models/dug/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9c1bc6e2f560bb2432c338b19b79061b673a350 --- /dev/null +++ b/full_models/dug/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cdab62a5813e15b9b3092b85d61e23e654c8a8d11d564a6c32378991b7e5c4 +size 561078892 diff --git a/full_models/dug/G_100000.pth b/full_models/dug/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a886651091629f99ac7b62cb2126ca2473243b8 --- /dev/null +++ b/full_models/dug/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e91fceaf4d0920ad4cf65dc22b113ff33d6e5aaa9948e8d25cf5ee14c51e8d +size 436362831 diff --git a/full_models/dug/config.json b/full_models/dug/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dug/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dug/vocab.txt b/full_models/dug/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1ae381fb00735b7d6bc5963811f636c8418f0608 --- /dev/null +++ b/full_models/dug/vocab.txt @@ -0,0 +1,30 @@ +a +| +i +u +n +m +e +o +k +h +w +l +r +y +d +g +t +s +z +' +c +b +p +v +j +á +f +- +6 + diff --git a/full_models/dwr/D_100000.pth b/full_models/dwr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2d8f09f4d566171a3523bf85b72a407ecd2fb443 --- /dev/null +++ b/full_models/dwr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc38da7a3b4b891ae11dc7cfa5d65344de19ab4f22e2a3b4f6d326801ed83a38 +size 561078351 diff --git a/full_models/dwr/G_100000.pth b/full_models/dwr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6e38056c9622174387c559ef00f9802085b99b7f --- /dev/null +++ b/full_models/dwr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:119631ed08d17161720cadbd82c85520b0d1173d2c8a1c1285a8b9bbc7999e9f +size 436359759 diff --git a/full_models/dwr/config.json b/full_models/dwr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dwr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dwr/vocab.txt b/full_models/dwr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..648c87cc2d13018c4afd536789d072ebd5686f9f --- /dev/null +++ b/full_models/dwr/vocab.txt @@ -0,0 +1,30 @@ +a +| +e +i +n +t +d +o +s +y +u +h +w +k +g +m +p +b +l +r +q +7 +x +c +z +f +' +j +- + diff --git a/full_models/dyi/D_100000.pth b/full_models/dyi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3cb4e66752d56e03df8ccf6f86373f62235bf927 --- /dev/null +++ b/full_models/dyi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980c01dfbc8d0d70eb3e1ed829e9a5230283f58200bfad78aac351214028c1dd +size 561078712 diff --git a/full_models/dyi/G_100000.pth b/full_models/dyi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0f7b2d9013b6e4c0ada93e1fef542f7a255a2b3 --- /dev/null +++ b/full_models/dyi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce56ce4aadf03800a9a27ef210f1e2b78ea00d6705eb19b0b83380fa69594524 +size 436374203 diff --git a/full_models/dyi/config.json b/full_models/dyi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dyi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dyi/vocab.txt b/full_models/dyi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..637f829ba7f41a1aa7732954ace9a273f3e2b532 --- /dev/null +++ b/full_models/dyi/vocab.txt @@ -0,0 +1,36 @@ +| +a +n +i +e +ɛ +y +l +w +g +k +o +p +ɔ +r +m +u +t +s +ŋ +b +f +j +ì +z +h +d +è +à +c +' +v +ù +ò +̀ + diff --git a/full_models/dyo/D_100000.pth b/full_models/dyo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..599cf3276a9fedde4e9940066a1b1da04412d955 --- /dev/null +++ b/full_models/dyo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b43361c372646775a18363644783baf0f167579592bc729031da1b74b1df9257 +size 561078762 diff --git a/full_models/dyo/G_100000.pth b/full_models/dyo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..541de31be8bcafeb051d1c50c48fadee03fd4cd7 --- /dev/null +++ b/full_models/dyo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f381e2fa5382a10f06ec47ac08f80db8c5104a6dab00382476886df57018ac +size 436371384 diff --git a/full_models/dyo/config.json b/full_models/dyo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dyo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dyo/vocab.txt b/full_models/dyo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..59771e35fd0339238ad78e9327d2364f81c35e7f --- /dev/null +++ b/full_models/dyo/vocab.txt @@ -0,0 +1,34 @@ +a +| +i +u +n +m +e +k +o +t +b +l +j +r +d +y +s +f +á +p +ú +w +ŋ +g +ñ +c +í +' +é +h +ó +- +— + diff --git a/full_models/dyu/D_100000.pth b/full_models/dyu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..78547f3ccd2690225fda935714ba0e5a550dfafa --- /dev/null +++ b/full_models/dyu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1234cdddaf22ab8f71f65691d350ed151bfacc9acd4840e346407564025e9e4c +size 561078873 diff --git a/full_models/dyu/G_100000.pth b/full_models/dyu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..90dc36be17dbb27a404c00b77ee6654c7e5f6414 --- /dev/null +++ b/full_models/dyu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fc5ece1bfc8c9e735c684239a3c45b4e983a22753aa9e558b925e1f7c5c7ff +size 436367228 diff --git a/full_models/dyu/config.json b/full_models/dyu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dyu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dyu/vocab.txt b/full_models/dyu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..127dfe0490c8b49b308c280beb7600fbe0076c07 --- /dev/null +++ b/full_models/dyu/vocab.txt @@ -0,0 +1,32 @@ +t +y +b +u +j +ɲ +p +o +s +w +m +h +i +_ +' +l +f + +- +g +n +z +ɛ +a +k +ɔ +v +d +r +ŋ +e +c diff --git a/full_models/dzo/D_100000.pth b/full_models/dzo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7d9d24415c11c64a4d3374e7884c4f542668ad2b --- /dev/null +++ b/full_models/dzo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2deb8a998ead201d464b5358b9f9a99f3463c0faca1f4d1a448ae83dea792bcb +size 561109761 diff --git a/full_models/dzo/G_100000.pth b/full_models/dzo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c26dba1d9a8d8a327fd3bce550a52eb16c005c6e --- /dev/null +++ b/full_models/dzo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7785e9f37399cca7667f9c9c8602b6d017dd21432798400825918b89f3a1dbd +size 436659760 diff --git a/full_models/dzo/config.json b/full_models/dzo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/dzo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/dzo/vocab.txt b/full_models/dzo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aaae0c25e048873ed18115d5cf1e78c517a37aad --- /dev/null +++ b/full_models/dzo/vocab.txt @@ -0,0 +1,58 @@ +་ +ི +ས +ག +ད +ོ +ུ +ེ +བ +ན +ང +མ +ལ +ར +འ +ྱ +ཁ +པ +ཅ +ཀ +ཡ +ཚ +ཟ +ྲ +ཨ +ཏ +ཆ +ཤ +ྦ +ྟ +ཐ +ཞ +ྐ +ཕ +ཱ +ཝ +ྒ +ླ +ྡ +ཉ +ྨ +ཙ +ཛ +ཧ +ྤ +ྩ +ྷ +ཇ +ྗ +ྔ +ྣ +ྙ +ྫ +ྕ +ྭ +ཌ +ཪ + diff --git a/full_models/eip/D_100000.pth b/full_models/eip/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..493fb9d2d52cdcf99d5ed5c21f57ceba3f7df0e9 --- /dev/null +++ b/full_models/eip/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9ac0c55f47d0a11fcb9be33a3a66e03cd24ca8d0543424e255629c2598e531 +size 561076163 diff --git a/full_models/eip/G_100000.pth b/full_models/eip/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..099794e6c772f00ca7c6df1198f5daabcab9cf5f --- /dev/null +++ b/full_models/eip/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d59268b3eb406ac2c877c3b2142546cefe94d43d52dbb462366758282ef4d59 +size 436360120 diff --git a/full_models/eip/config.json b/full_models/eip/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/eip/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/eip/vocab.txt b/full_models/eip/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..495a497789dccfc04976bb3903787daf0a3ca7fb --- /dev/null +++ b/full_models/eip/vocab.txt @@ -0,0 +1,38 @@ +x +c +g +n +j +f + +s +6 +w +h +5 +9 +r +2 +' +o +d +8 +0 +i +k +1 +a +3 +p +l +m +z +y +b +- +_ +t +4 +u +e +7 diff --git a/full_models/eka/D_100000.pth b/full_models/eka/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..357fe32d1b66fc2854990e6679638528eb2c60dd --- /dev/null +++ b/full_models/eka/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:587c4b84edb1d6704740cdaec593876ff0e297594aeca496e2b11868c087b19e +size 561078749 diff --git a/full_models/eka/G_100000.pth b/full_models/eka/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e46da2bb912e4bbdf6b3394c4a4687c05c33b4f --- /dev/null +++ b/full_models/eka/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba9d3bddbee47a92123b4ae764e3bedb4d7e69d9c4f4fe028852bd7de4e362c +size 436360399 diff --git a/full_models/eka/config.json b/full_models/eka/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/eka/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/eka/vocab.txt b/full_models/eka/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5ac04106fa85272d568c7a8ca9c8ab53db5cb1c3 --- /dev/null +++ b/full_models/eka/vocab.txt @@ -0,0 +1,29 @@ +f +o +s +n +ḿ +m +p +i +d +ń +e +w +- +v +j +u +' +k +y +g +r +á +b +h +l +t +a +_ + diff --git a/full_models/ell/D_100000.pth b/full_models/ell/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3509672f011ecf383685844b04c39d4b56e75b7 --- /dev/null +++ b/full_models/ell/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f29a67389a831eb315dadce35271b3d86b496de6e4eafc0c93efbc7e6af3c2b +size 561110632 diff --git a/full_models/ell/G_100000.pth b/full_models/ell/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b6b5481a421d52f31f1fb33bb68ad297d29c59a6 --- /dev/null +++ b/full_models/ell/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb87a5e4c82d73614465c9378a29a63a89ed5eb28a7c2de57cb829642306eb77 +size 436680169 diff --git a/full_models/ell/config.json b/full_models/ell/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ell/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ell/vocab.txt b/full_models/ell/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..f7b8fe0a3ec8a7c8066ced4de9be87bd6b94a24e --- /dev/null +++ b/full_models/ell/vocab.txt @@ -0,0 +1,64 @@ +b +1 +ή +p +5 +θ +ί +i +x +δ +ά +λ +7 +- +φ +π +ω +' +ϊ +k +ό +ψ +n +t + +y +τ +a +4 +β +â +κ +9 +γ +ξ +8 +χ +ε +h +ν +ζ +z +η +m +o +2 +6 +3 +e +υ +ώ +ϋ +έ +σ +ι +μ +α +ο +_ +ύ +0 +ς +ρ +ΐ diff --git a/full_models/emp/D_100000.pth b/full_models/emp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..769b3f73c2b67c1360a154029d4149ba70d14f3e --- /dev/null +++ b/full_models/emp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d154a64742c33e12d1f6d6013879cc7bf1463a00285f6b05fd994f7ebdcb2628 +size 561110026 diff --git a/full_models/emp/G_100000.pth b/full_models/emp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b3ba1d45e5571f022293cdd13ce903caf551d766 --- /dev/null +++ b/full_models/emp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4baf5a6990e80220b1bf97dc4a748c3543689eafae890f9d530f5fca2050c7 +size 436660940 diff --git a/full_models/emp/config.json b/full_models/emp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/emp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/emp/vocab.txt b/full_models/emp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..504f65560422f94b7886be2b005c75b84e1e0bf3 --- /dev/null +++ b/full_models/emp/vocab.txt @@ -0,0 +1,57 @@ +a +| +r +i +b +e +â +d +j +ö +ô +u +c +m +n +o +õ +s +å +w +ó +p +é +t +ì +q +ï +y +ã +z +g +h +l +– +è +ò +v +ä +á +ð +ú +ë +4 +9 +0 +2 +1 +6 +5 +x +ñ +3 +8 +7 +k +- + diff --git a/full_models/enb/D_100000.pth b/full_models/enb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..43493e1195db46476933e15aa01724244a2449ce --- /dev/null +++ b/full_models/enb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93078bd99c70297167ead96306eb8b0dbcd66c27f65253f9b68ed84cefcd3a06 +size 561109582 diff --git a/full_models/enb/G_100000.pth b/full_models/enb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..80e1007fe84ba1c10b57d67b34715de9b0605c49 --- /dev/null +++ b/full_models/enb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:501ab62f7894965952d23a0541b1974a298b9d951fee5d54d3ee36a73c5e9a06 +size 436597510 diff --git a/full_models/enb/config.json b/full_models/enb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/enb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/enb/vocab.txt b/full_models/enb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b704d654cb7461d446682bc3129255a846956d30 --- /dev/null +++ b/full_models/enb/vocab.txt @@ -0,0 +1,31 @@ +| +i +k +o +ē +a +n +u +y +ō +t +r +c +h +p +e +m +ā +l +w +s +g +ʼ +- +' +0 +1 +2 +6 +4 + diff --git a/full_models/eng/D_100000.pth b/full_models/eng/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..557198003b17c214efb457b36dda4005658da941 --- /dev/null +++ b/full_models/eng/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b1d7a2726b3cb27c18604ace828556d9c17c09f65eb041f690a89c99d7aea4 +size 561110135 diff --git a/full_models/eng/G_100000.pth b/full_models/eng/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f379208af40e047a7c995eb3d10d5be33f946b6 --- /dev/null +++ b/full_models/eng/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d276cee0f8291de23c8ed4f4a2ed15e3e4cff7b2d6af43660cd6b5e6e1149110 +size 436618116 diff --git a/full_models/eng/config.json b/full_models/eng/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/eng/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/eng/vocab.txt b/full_models/eng/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..9290e22c452c95c744390cdbd8bd13a4c1785622 --- /dev/null +++ b/full_models/eng/vocab.txt @@ -0,0 +1,38 @@ +k +' +z +y +u +d +h +e +s +w +– +3 +c +p +- +1 +j +m +i + +f +l +o +0 +b +r +a +4 +2 +n +_ +x +v +t +q +5 +6 +g diff --git a/full_models/enx/D_100000.pth b/full_models/enx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ec809cdc76da2b3b06c2eaa6568881ee454d207 --- /dev/null +++ b/full_models/enx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294af76d2b6c3d8f7a1de679ec3f40e56c91c780a087b5ea00e4aba37c107813 +size 561078578 diff --git a/full_models/enx/G_100000.pth b/full_models/enx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b46fd9644f5a22cbeb309f3a7dea6b668143d21 --- /dev/null +++ b/full_models/enx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccdd2e5eb0b4baf10269a8d18dd48f76517f44b4eabf4affabef91e00b7790fc +size 436380316 diff --git a/full_models/enx/config.json b/full_models/enx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/enx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/enx/vocab.txt b/full_models/enx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0b96990aad72841f10671537e7802e3ca8402661 --- /dev/null +++ b/full_models/enx/vocab.txt @@ -0,0 +1,39 @@ +ú +é +ẽ +— +w +y +à +a +m +z +v +n +í +i +l +ñ +u +g +r +' +f +h +e +o +t +b +q +x +p +è +s +á +d +j + +k +c +_ +ó diff --git a/full_models/ese/D_100000.pth b/full_models/ese/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..444f7310b219f519459b9b8ecd8bb57e5e8539e3 --- /dev/null +++ b/full_models/ese/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2597480ae4a5a5c43cbf0e66a52be889d76a5ec8a79463eae74f5fd8d6add8 +size 561076247 diff --git a/full_models/ese/G_100000.pth b/full_models/ese/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c1d2266608ba3ae6f0daa37b2c0c56b0f5a976fc --- /dev/null +++ b/full_models/ese/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a1a5d344b941d34b4f601071780c4b3cae850a5a4eb0cef877194f826e80b7 +size 436378983 diff --git a/full_models/ese/config.json b/full_models/ese/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ese/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ese/vocab.txt b/full_models/ese/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..09ea7ff9265bb5978050d8be5cd15cf58757b860 --- /dev/null +++ b/full_models/ese/vocab.txt @@ -0,0 +1,46 @@ +a +| +j +e +i +o +u +n +c +m +y +h +p +q +s +b +' +t +ñ +- +d +r +l +— +g +í +é +v +f +0 +á +z +ó +1 +2 +4 +5 +ú +x +6 +3 +9 +7 +k +8 + diff --git a/full_models/ess/D_100000.pth b/full_models/ess/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..00e2ad57ad8286e97dd5856219b42f3791d750ff --- /dev/null +++ b/full_models/ess/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6423fcba2a002a207b0507a64de51bbfab106fd7840bdbd81e3f89ca08476f71 +size 561078626 diff --git a/full_models/ess/G_100000.pth b/full_models/ess/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82b635398f938f5d68c0e7ffcc6d7b4994b27e1d --- /dev/null +++ b/full_models/ess/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e627c67111a513cb1f8dd01eff88ba42e6ea015601cf002ca80868bcd61707a +size 436391818 diff --git a/full_models/ess/config.json b/full_models/ess/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ess/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ess/vocab.txt b/full_models/ess/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d13f89dd70c6b9f9764d3143873ad028bc068cfd --- /dev/null +++ b/full_models/ess/vocab.txt @@ -0,0 +1,43 @@ + +c +1 +s +0 +f +8 +v +2 +x +_ +w +g +m +l +3 +‐ +9 +q +i +e +u +ʼ +j +d +b +r +y +n +z +5 +' +- +6 +ꞌ +7 +k +a +4 +p +h +o +t diff --git a/full_models/eus/D_100000.pth b/full_models/eus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4fc4fb4f17b0f3b9699f6886b7c9bbdf55594046 --- /dev/null +++ b/full_models/eus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43423b5658548a0edc686816bc02624d4a5067a7d98dec24a8704cd70e5ce40e +size 561079233 diff --git a/full_models/eus/G_100000.pth b/full_models/eus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b719a1d120c3a2dd99e1ae1dccc34c658e00728 --- /dev/null +++ b/full_models/eus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff9b8674548b0033bbcef25afa8f69d3cebd837ef846064a11b380c9924ec2d +size 436355735 diff --git a/full_models/eus/config.json b/full_models/eus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/eus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/eus/vocab.txt b/full_models/eus/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..74fb1bb1fb18c25ca1cf73b0c9ba3b17b86be79f --- /dev/null +++ b/full_models/eus/vocab.txt @@ -0,0 +1,26 @@ +b +— +o + +s +u +p +_ +f +r +x +a +h +t +l +g +e +m +v +k +j +n +d +i +z +- diff --git a/full_models/evn/D_100000.pth b/full_models/evn/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..139fbd51e26640beb1627d0897c32d36937ca5dd --- /dev/null +++ b/full_models/evn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ddf279750ad6190a69e6f773c66a2a5965948e2e916900c47e09985879028d +size 561076160 diff --git a/full_models/evn/G_100000.pth b/full_models/evn/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..be2ca03967f6a5355dbaa874c2cb003824883dbf --- /dev/null +++ b/full_models/evn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1aa4fa4bfc3b83534b8207827917e9891185a646904713c81efcafce583784b +size 436360109 diff --git a/full_models/evn/config.json b/full_models/evn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/evn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/evn/vocab.txt b/full_models/evn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86ee78238513b1435180503fbdf198314e30b97a --- /dev/null +++ b/full_models/evn/vocab.txt @@ -0,0 +1,38 @@ +| +н +э +а +у +д +л +и +т +к +р +ӣ +в +м +с +ӯ +ч +г +ӈ +б +е +ы +х +о +- +я +– +п +ё +ю +й +ф +ь +ъ +ц +ш +з + diff --git a/full_models/ewe/D_100000.pth b/full_models/ewe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5327d77d2134fef8369e61f25d31414a5674ecae --- /dev/null +++ b/full_models/ewe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2364658e91f0bd0b842289be52f321911e20d497dcae430e3818c49c2754ad9 +size 561078870 diff --git a/full_models/ewe/G_100000.pth b/full_models/ewe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8bc8db76c293d98d8473ed5cd3bcd1e1fda34f13 --- /dev/null +++ b/full_models/ewe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21be182b3943994ccd334eba2cced2e82fbf46b87e4069602df757795121a58 +size 436411100 diff --git a/full_models/ewe/config.json b/full_models/ewe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ewe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ewe/vocab.txt b/full_models/ewe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..853565eb9ef5cc5ab390edcaa2454779fca24151 --- /dev/null +++ b/full_models/ewe/vocab.txt @@ -0,0 +1,51 @@ +r +w +a +l +g +ɣ +k +̀ +b +n +ŋ +x +d +á + +ù +s +o +p +ɖ +í +ƒ +z +ɔ +_ +̃ +i +à +ũ +v +h +ã +y +ʋ +- +́ +ɛ +è +ú +e +t +ó +m +ì +é +ò +f +' +ẽ +u +ĩ diff --git a/full_models/eza/D_100000.pth b/full_models/eza/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5bf17d3b11c7270510c0d8a51c5c50b8a2b25c37 --- /dev/null +++ b/full_models/eza/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67a26f7e02e4f5b788f9c6e5c000247aa09ae37ec6bde4deb819f0aea638a8ac +size 561078603 diff --git a/full_models/eza/G_100000.pth b/full_models/eza/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b2ac66f8da183df7a6f4e069d6211d350c3d499 --- /dev/null +++ b/full_models/eza/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ab3cb8c042a9237fe31e89600de593b8f195af5a50860d84aefbd6d795d1a9 +size 436394321 diff --git a/full_models/eza/config.json b/full_models/eza/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/eza/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/eza/vocab.txt b/full_models/eza/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e081436818ce598c2679b205d2834f2fd01f87b7 --- /dev/null +++ b/full_models/eza/vocab.txt @@ -0,0 +1,45 @@ +_ +à +h +n +̀ +í +ò +é +y +ụ +i +u +á +g +a +s +ẹ +ù +c +è +j +z +ó +ị + +ì +d +f +- +ú +b +ọ +m +l +6 +p +' +e +o +r +w +k +v +t +́ diff --git a/full_models/fal/D_100000.pth b/full_models/fal/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f315ca3525ee4b5953fdb1412cd4303b2bd1b9a1 --- /dev/null +++ b/full_models/fal/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6aff22d8a7ffa5661a5b5cb6545529688654b84756f9b265496a2df576a299 +size 561110225 diff --git a/full_models/fal/G_100000.pth b/full_models/fal/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed105166719b48e2f2b7e951518d9f8a3212c821 --- /dev/null +++ b/full_models/fal/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554b71d3a5ab81fa08d8c957215af54e5c28695f76416aa2f25293346f543a96 +size 436615750 diff --git a/full_models/fal/config.json b/full_models/fal/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fal/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fal/vocab.txt b/full_models/fal/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..51dcb592bfe5ce94927773106e181425e6dfc0a8 --- /dev/null +++ b/full_models/fal/vocab.txt @@ -0,0 +1,38 @@ +| +a +i +n +e +y +r +m +g +t +u +k +o +w +à +d +s +â +è +b +j +l +p +h +f +î +c +ò +ɗ +û +' +ɓ +- +ê +ù +1 +v + diff --git a/full_models/fao/D_100000.pth b/full_models/fao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f88d7668d40e849a471e02ecd6c88672f7ce8d55 --- /dev/null +++ b/full_models/fao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9cad228eb976f62d1d6e59b51c4de0f50858d4e2efd62615c36d57474d944e4 +size 561078886 diff --git a/full_models/fao/G_100000.pth b/full_models/fao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dede67dfcd2949937ce23cebc826686d758bf867 --- /dev/null +++ b/full_models/fao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0f450a085518cda3de9b75b72dd11c70a259fd2eb385f57f0eeca44afb25dd +size 436379264 diff --git a/full_models/fao/config.json b/full_models/fao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fao/vocab.txt b/full_models/fao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4a69847d415993a9264dbb91afea8dbce413ad5a --- /dev/null +++ b/full_models/fao/vocab.txt @@ -0,0 +1,37 @@ + +z +i +h +m +r +u +k +s +d +v +f +ó +b +– +p +í +e +j +- +y +ø +l +1 +æ +a +o +ú +ð +ý +4 +n +_ +t +7 +á +g diff --git a/full_models/far/D_100000.pth b/full_models/far/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..047907db0922d041805dddea135a4f849b1332a1 --- /dev/null +++ b/full_models/far/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7088e05f75aa3d708c2f54a5053b95593ef6727dbabf044c04b87e0c85a5fd3 +size 561078745 diff --git a/full_models/far/G_100000.pth b/full_models/far/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3dae49ce7db2f79c508e0854f9d022f425033f7a --- /dev/null +++ b/full_models/far/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08fe6cb3f3169c0f8c5ca8bf45a1d45938602691b0f5b56e20a710adc1d8dae0 +size 436354930 diff --git a/full_models/far/config.json b/full_models/far/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/far/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/far/vocab.txt b/full_models/far/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..73d179dc0f8861206b6cdbf4d8ba1c52482ce4dd --- /dev/null +++ b/full_models/far/vocab.txt @@ -0,0 +1,27 @@ +b +h +d +p +g +' +c +w +l +n +s +_ +6 +e +o +t +y +f +r +v +i +a +j +u + +k +m diff --git a/full_models/fas/D_100000.pth b/full_models/fas/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f6a8d12468c338884ede89e9fdb4aa785ef463a --- /dev/null +++ b/full_models/fas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba20854f5c38c5e425233fc063d1485cdc3c020a2f50ae220943c820efc0d12f +size 561078869 diff --git a/full_models/fas/G_100000.pth b/full_models/fas/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..e3051a62df7c2b84dba56429bcbd3afa51e2d6c4 --- /dev/null +++ b/full_models/fas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74189891ddae7e5d26a43c6c49ccbe93fb31fd5ef90a3670168be73107daf10 +size 436396990 diff --git a/full_models/fas/config.json b/full_models/fas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fas/vocab.txt b/full_models/fas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ea255d24a66c2e529f3f399d5d0e3191902e52b2 --- /dev/null +++ b/full_models/fas/vocab.txt @@ -0,0 +1,44 @@ +ل +پ +ع +أ +ئ +ذ +_ +ك +ج +ر +ه +ف +گ +ي +ء +ی +ص +ق +ح +ط +ث +ٔ +ن +م +ظ +ت +ب +و +د +غ + +ش +خ +ک +آ +- +ؤ +چ +ژ +س +' +ا +ض +ز diff --git a/full_models/fij/D_100000.pth b/full_models/fij/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..47bf0bd7d52cf48177c6793edf1a89ab737fc201 --- /dev/null +++ b/full_models/fij/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c1b1c4d246078d4d0e3961fcbda49d7f0f2295208930e0821d6d8b3a9ff48c +size 561109738 diff --git a/full_models/fij/G_100000.pth b/full_models/fij/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d05c29d67847dfbd68e5db0581c6339a55b1ab7f --- /dev/null +++ b/full_models/fij/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b57374d2ca2a76ad5f6d05288ad995c0bdce606882ca36951bc25168b179db3 +size 436609085 diff --git a/full_models/fij/config.json b/full_models/fij/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fij/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fij/vocab.txt b/full_models/fij/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..66e865d76ef80708cc834c094aa7b43048835b3c --- /dev/null +++ b/full_models/fij/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +k +n +e +u +o +v +t +s +l +r +m +d +g +y +c +q +b +w +p +j +' +f +ʻ +ʼ +- +0 +2 +1 +— +3 +5 +4 + diff --git a/full_models/fin/D_100000.pth b/full_models/fin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..73f966c6cad3405d7c3184855eb50209913a179c --- /dev/null +++ b/full_models/fin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2a84b5d45bfd82e09b96b3486bedcc17c363565e3b31501ce78a19e4c1ba55c +size 561110240 diff --git a/full_models/fin/G_100000.pth b/full_models/fin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8bab611303bb0c914578cbdcc280fac33b53a7ce --- /dev/null +++ b/full_models/fin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463dcf58e2aa488ae253674f0296dbd972ee968cc40b3b9928da72bb68dc7f40 +size 436596134 diff --git a/full_models/fin/config.json b/full_models/fin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fin/vocab.txt b/full_models/fin/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..68e5a7d851b15f888720851e0c7630235d98f663 --- /dev/null +++ b/full_models/fin/vocab.txt @@ -0,0 +1,28 @@ +p +g +j +v +y +z +s +ä +b +- +m +h +t + +r +f +' +_ +l +ö +u +n +a +k +d +o +e +i diff --git a/full_models/flr/D_100000.pth b/full_models/flr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f86414f632973a4bac77807fac221006e567e365 --- /dev/null +++ b/full_models/flr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a55cf6524ee8071464f1984dae672b2f8a604444f3e9cc065813da653abd97a +size 561078963 diff --git a/full_models/flr/G_100000.pth b/full_models/flr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b6bb185d8bd75c6faf049bb57be40ec4d7ddd92 --- /dev/null +++ b/full_models/flr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1159cb3ec51830db3672347378fb735f76a6e64144b9cc2a768fcf11da97c44f +size 436368438 diff --git a/full_models/flr/config.json b/full_models/flr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/flr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/flr/vocab.txt b/full_models/flr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a8bd516c1d04925f2ec2bf10a45b62e7fbb6f965 --- /dev/null +++ b/full_models/flr/vocab.txt @@ -0,0 +1,32 @@ +f +ꞌ +â +p +e +ù +n +h +ú +d +w +l +_ + +k +j +z +r +í +y +u +o +g +- +m +t +s +i +b +v +a +á diff --git a/full_models/fmu/D_100000.pth b/full_models/fmu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bafd868ba9257eeb01e196a6d02e51287c7ae76 --- /dev/null +++ b/full_models/fmu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e83182d3397bb6bca71920516d1a215d30056ba58d6c41c4e120cd5cf0acfe +size 561076147 diff --git a/full_models/fmu/G_100000.pth b/full_models/fmu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ccfcb466985eca90ddaff3fd4ed9e1994e9613e8 --- /dev/null +++ b/full_models/fmu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6578ef67aa4c2a5d012b8123b27df6dc9d56e35f4e4be32e114eb4115b48cfc +size 436387492 diff --git a/full_models/fmu/config.json b/full_models/fmu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fmu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fmu/vocab.txt b/full_models/fmu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..455f3fd6854670c5498ead11abf15775d6976a2c --- /dev/null +++ b/full_models/fmu/vocab.txt @@ -0,0 +1,50 @@ +ऊ +स +‍ +ि +़ +ी +ओ +य +ळ +अ +घ +ै +_ +इ +ड +ए +ब +म +ू +ल +1 +च +ा +ो +ह +ण +' +श +आ +द +उ +क +प +ज +् +ट +ष +- +ु +े +व +त +ग +भ +ध +ं +न + +ख +र diff --git a/full_models/fon/D_100000.pth b/full_models/fon/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f1388b6dff3fad863fbf47ec24ae4ba1cb8461e0 --- /dev/null +++ b/full_models/fon/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a47f7c790bc57412757d46e3614a352884ca2187ffad1828e0a7b6762dd14c +size 561078887 diff --git a/full_models/fon/G_100000.pth b/full_models/fon/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ecb79ed71c831a45119447030916b6d5923d0a64 --- /dev/null +++ b/full_models/fon/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4760e107c35d99f627910a747271a6cc92f4f1b95e261a79be173a4922f0c92 +size 436399589 diff --git a/full_models/fon/config.json b/full_models/fon/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fon/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fon/vocab.txt b/full_models/fon/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..defe146a04635911d072f2511fe725b605fc92e9 --- /dev/null +++ b/full_models/fon/vocab.txt @@ -0,0 +1,46 @@ +_ +è +ɖ +̌ +ǐ +t +d +- +f +e +ó +ú +é +v +ǎ +g +' + +s +ǔ +k +́ +a +n +h +i +í +b +u +p +m +á +j +đ +l +ǒ +x +ɔ +z +y +c +o +w +ì +ě +ɛ diff --git a/full_models/fra/D_100000.pth b/full_models/fra/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af994b36a1a483d72778c0769d41dbc92af51b8c --- /dev/null +++ b/full_models/fra/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82b5164f0c3cb5a6495d574fe7bf1cbccda3722631b6c966a29902b970d0fd2 +size 561110144 diff --git a/full_models/fra/G_100000.pth b/full_models/fra/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..41b71b8063bb07597799564c345eae59906e95fe --- /dev/null +++ b/full_models/fra/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd4be5a43467c25e5eab0aacfe150db56b58c963673b7a619ffe5b29d796d25 +size 436630929 diff --git a/full_models/fra/config.json b/full_models/fra/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/fra/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/fra/vocab.txt b/full_models/fra/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..54bbe0753eef3fdc5fd52938e68cb9f3ecb209a6 --- /dev/null +++ b/full_models/fra/vocab.txt @@ -0,0 +1,44 @@ +î +z +- +ù +u +û +y +è +x +q +c +g +ô +ê +_ +e +i +d +b +a +f +œ +h +r +é +k +s +v +à + +– +p +ë +t +n +o +j +ü +â +ç +ï +' +m +l diff --git a/full_models/frd/D_100000.pth b/full_models/frd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d04f076ad3080e7f64a483fb3fe69fddab01915a --- /dev/null +++ b/full_models/frd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ccbe79ac48b26d10351c94b88cd1dd64ac604e76a9d8d32ea281e29cce3928 +size 561079144 diff --git a/full_models/frd/G_100000.pth b/full_models/frd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd96994baafa27122530f927830ecf6b22c9ce2a --- /dev/null +++ b/full_models/frd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1c5bbd402bd88cd2bd9be694c686c8b7afbc054eb06b53e2df199eb796ed7b +size 436359137 diff --git a/full_models/frd/config.json b/full_models/frd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/frd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/frd/vocab.txt b/full_models/frd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3755d0efc17e50217e17b29716611f7a3c26d40b --- /dev/null +++ b/full_models/frd/vocab.txt @@ -0,0 +1,29 @@ +b +v +o +m +ꞌ +j +e +d +f +z +n +l +p +h +c +w +r +k + +a +i +' +_ +- +y +u +t +s +g diff --git a/full_models/ful/D_100000.pth b/full_models/ful/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c70f5bf038c1059125aabefab7d6868c169386fa --- /dev/null +++ b/full_models/ful/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a750fd360239b86fb05646c8bf6533be0b641717982d187b49173e8f4dd0ed6 +size 561078884 diff --git a/full_models/ful/G_100000.pth b/full_models/ful/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..29b5a45050a3e2e9ff7187b63803b2cb94d263cf --- /dev/null +++ b/full_models/ful/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ccac3bbd0ac31ba6d7a665947a658bd21a1ffb50a706d610d308aee3751cdec +size 436389248 diff --git a/full_models/ful/config.json b/full_models/ful/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ful/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ful/vocab.txt b/full_models/ful/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..1d4276822594caa858b23c9e87f837542799dd1b --- /dev/null +++ b/full_models/ful/vocab.txt @@ -0,0 +1,41 @@ +| +a +o +i +e +n +m +u +ɗ +k +d +l +r +y +ɓ +w +t +g +h +' +s +b +j +f +c +p +ƴ +0 +‐ +ŋ +4 +1 +2 +5 +3 +6 +7 +9 +8 +— + diff --git a/full_models/gag-script_cyrillic/D_100000.pth b/full_models/gag-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..939b278404d840a4dc6f2bef6d17c947b9ba88a8 --- /dev/null +++ b/full_models/gag-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ac86483ebe752b085ddf9779f5ac8e268928f09ec3f0866971e3bc0d51bd5c +size 561079250 diff --git a/full_models/gag-script_cyrillic/G_100000.pth b/full_models/gag-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..714f14d5c028af5af92e0f9ac669cdd7c823a88e --- /dev/null +++ b/full_models/gag-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6931c93e02ed471e30919b661ce5567cfa7092debfaa7fdfaaf3024d56ce620a +size 436380621 diff --git a/full_models/gag-script_cyrillic/config.json b/full_models/gag-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gag-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gag-script_cyrillic/vocab.txt b/full_models/gag-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b0fb3b79b64d43d06911cac4152b711726c7228c --- /dev/null +++ b/full_models/gag-script_cyrillic/vocab.txt @@ -0,0 +1,36 @@ +л +н +с +з +у +ш +ы +о +_ +ӱ +б +ж +д +к +е +п +р +– +г + +ӓ +ӧ +ч +ф +и +й +ц +т +ӂ +в +' +м +- +х +э +а diff --git a/full_models/gag-script_latin/D_100000.pth b/full_models/gag-script_latin/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..865ec66b82d6e694e6fc4556ca9f06598c4840da --- /dev/null +++ b/full_models/gag-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba3c09615cf76ee61012436985601bd6a5fd3ef6c82235fd40f67d7c9ab29b7 +size 561078503 diff --git a/full_models/gag-script_latin/G_100000.pth b/full_models/gag-script_latin/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..dfc19207333fd1dcd8b872fe2493848c45db4433 --- /dev/null +++ b/full_models/gag-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692cdc279148c5c24c6c62763a50b79a906c74b38ddb39963075cf9c681edbec +size 436377669 diff --git a/full_models/gag-script_latin/config.json b/full_models/gag-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gag-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gag-script_latin/vocab.txt b/full_models/gag-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5c17fcd05c51554751e5a5744ab36e1a2529e977 --- /dev/null +++ b/full_models/gag-script_latin/vocab.txt @@ -0,0 +1,38 @@ +| +a +n +і +r +e +l +d +ı +k +s +m +o +ä +u +t +b +z +y +ü +h +ş +g +ç +p +v +c +ö +ê +i +̇ +f +– +- +ţ +j +' + diff --git a/full_models/gai/D_100000.pth b/full_models/gai/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4c320391c26ca112ab0f8c9a8b39aad0d08ac1a --- /dev/null +++ b/full_models/gai/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128ae53c3d0d31e27063c6325acc51cfae1ca7d002630e40ee56590be0f42d01 +size 561078580 diff --git a/full_models/gai/G_100000.pth b/full_models/gai/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..07aebee32bda83c48774109d02d01b8d4b75d15c --- /dev/null +++ b/full_models/gai/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c495fcfdc593e7010fadce5bda04f55ed101885a184f4a53fef4d3fece5b594 +size 436366642 diff --git a/full_models/gai/config.json b/full_models/gai/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gai/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gai/vocab.txt b/full_models/gai/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7750077184ea0654f4f4f70b06652de66a32af30 --- /dev/null +++ b/full_models/gai/vocab.txt @@ -0,0 +1,33 @@ +m +5 +t +r +o +7 +g +c +e + +' +ɨ +l +ŋ +_ +0 +k +n +9 +a +i +u +3 +1 +b +8 +w +d +p +6 +s +4 +2 diff --git a/full_models/gam/D_100000.pth b/full_models/gam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91f5687bbdf3ab3ef07d13fc6ff333e9d62b1e16 --- /dev/null +++ b/full_models/gam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:125aae404899c96b040bbc36d1a1035313fd98b5ffc17ed1aab149594451991d +size 561079102 diff --git a/full_models/gam/G_100000.pth b/full_models/gam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f24c69f614adce8adda84f0f14ee5469f5484b57 --- /dev/null +++ b/full_models/gam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ebd9275205aae852f79bf6803c0c31b1f9b2ddc648532861305bb5e003bbb6 +size 436367632 diff --git a/full_models/gam/config.json b/full_models/gam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gam/vocab.txt b/full_models/gam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9da680c9dfa07b18b51634b98c027c2e1de33097 --- /dev/null +++ b/full_models/gam/vocab.txt @@ -0,0 +1,32 @@ +u +m +k +i +t +1 +g +3 +b +8 +- +_ +r +w +4 +7 +s +j +0 +d +e + +2 +y +o +l +6 +9 +n +a +p +5 diff --git a/full_models/gau/D_100000.pth b/full_models/gau/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a47d0c0f827f30e2d1f106e69038c08a624850a5 --- /dev/null +++ b/full_models/gau/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd35cab4be53e05edef640353a8ea5dc227a62375c08e785ece678ba08eca897 +size 561079150 diff --git a/full_models/gau/G_100000.pth b/full_models/gau/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8e46ab7f0e55ef3106ff716278f1f2455d200797 --- /dev/null +++ b/full_models/gau/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd599b1513c182beafa8e6aa0a5a047a07c510f48a0a2ae7d24cd4a25fc1e43c +size 436434468 diff --git a/full_models/gau/config.json b/full_models/gau/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gau/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gau/vocab.txt b/full_models/gau/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ab7679fa409f3bf57a417cb156a859546c202e7c --- /dev/null +++ b/full_models/gau/vocab.txt @@ -0,0 +1,61 @@ +ఔ +ణ +మ +ఒ +ఓ +హ +త + +చ +ఫ +ల +ష +బ +ఉ +ఐ +డ +గ +ఎ +ఖ +ూ +న +ద +భ +‍ +ా +క +ౌ +ృ +ే +ప +ె +ఞ +ు +ఆ +ీ +ఘ +్ +ి +ధ +' +ట +య +జ +ఏ +ఇ +ఈ +ః +_ +శ +ళ +ో +థ +ం +స +ఊ +ొ +ర +ఠ +వ +అ +ై diff --git a/full_models/gbi/D_100000.pth b/full_models/gbi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..997cd55e11d41fb288340291f2b69bf31f4c815e --- /dev/null +++ b/full_models/gbi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9442ee32e38095a4c0184d39e9189d8999c722eab95aac8f9cc3169b9c6410 +size 561109457 diff --git a/full_models/gbi/G_100000.pth b/full_models/gbi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8dbe09e0c4e88acfd457e436d06b559989f25055 --- /dev/null +++ b/full_models/gbi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36be0b1a720b604dc4c1402fbd63ff4129ba0c9a0978149315f8126c74b11dce +size 436604469 diff --git a/full_models/gbi/config.json b/full_models/gbi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gbi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gbi/vocab.txt b/full_models/gbi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0b3241de4606b75c6701affb781f91ad6cfbb9bb --- /dev/null +++ b/full_models/gbi/vocab.txt @@ -0,0 +1,34 @@ +| +a +o +i +n +e +g +m +k +s +u +d +l +w +t +r +b +y +h +p +ḋ +c +j +f +- +' +z +4 +0 +1 +2 +5 +6 + diff --git a/full_models/gbk/D_100000.pth b/full_models/gbk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a0007c76d2f7a2639afb8d6c11fb2f39abb81a1 --- /dev/null +++ b/full_models/gbk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4afc0f6453e7b289c1938e58026a6643d37ff46fc507387b7682f40aeb7752c +size 561079471 diff --git a/full_models/gbk/G_100000.pth b/full_models/gbk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81c0e7de40b0a1253bf2078b3328152dd3ad2697 --- /dev/null +++ b/full_models/gbk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f87da373c7b7149bf8c4426f7bf90dc1535c206c62923f636f0e181171db26c +size 436447952 diff --git a/full_models/gbk/config.json b/full_models/gbk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gbk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gbk/vocab.txt b/full_models/gbk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a78f4e5901c786c8bb4981db863c98f7376eda0e --- /dev/null +++ b/full_models/gbk/vocab.txt @@ -0,0 +1,66 @@ +ञ +ओ +ब +े +त +' +औ +ू +इ +ऊ +र +ळ +ड +आ +घ +प +फ +ौ +ि +ल +द +6 +न +अ +य +ै +ढ +– +- +स +व +ग +क +उ +च +ष +ट +ऑ +भ +ऐ +ण +छ +‍ +झ +् +थ +ँ +ध +ङ +ह +़ +ो +ी +श +ख +ृ +ा +ज +ए +ं +म +ठ +ु +_ +ई + diff --git a/full_models/gbm/D_100000.pth b/full_models/gbm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..574e059d9ce0a9dd635570a2b88b4fd45307e15b --- /dev/null +++ b/full_models/gbm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea527b1b109ef3123c18fbabb382a0ed7722044a142b938252cf182f9492fca +size 561078083 diff --git a/full_models/gbm/G_100000.pth b/full_models/gbm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b63f7d99774c2b4c8397b9a57eddafdb83d1de47 --- /dev/null +++ b/full_models/gbm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7860be83360aa3dadb03eed164fed75810f7f6e0360c059b74fd3bb89ac83c6 +size 436437813 diff --git a/full_models/gbm/config.json b/full_models/gbm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gbm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gbm/vocab.txt b/full_models/gbm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6a0f1e2b3d5b65e6ca5e17c7f984570eac28dafe --- /dev/null +++ b/full_models/gbm/vocab.txt @@ -0,0 +1,65 @@ +| +ा +र +क +ि +ं +म +ु +् +त +ी +ल +न +ै +प +व +े +द +ब +स +ो +य +ज +ह +अ +श +च +ण +ग +ट +छ +भ +ख +ू +ड +़ +ौ +उ +ऊ +आ +इ +ध +फ +ए +थ +ठ +ई +ष +- +ढ +झ +घ +ऐ +औ +ँ +ञ +ओ +ृ +ः +ळ +‍ +5 +0 +9 + diff --git a/full_models/gbo/D_100000.pth b/full_models/gbo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d792f85495b3e1c83e9d866135edf99b3f09562 --- /dev/null +++ b/full_models/gbo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74136c43d53c2f6597c6d90df76f6533401002065accaf3739cc4b5a6a5124b1 +size 561078985 diff --git a/full_models/gbo/G_100000.pth b/full_models/gbo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ee9e23b02a2f906c22a2dcbdb338dda7df10876d --- /dev/null +++ b/full_models/gbo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e3e4a748be0b4d172e46c9fd4a862edce827454afc3409450a0832f3ca7d6a0 +size 436397509 diff --git a/full_models/gbo/config.json b/full_models/gbo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gbo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gbo/vocab.txt b/full_models/gbo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c626a5f4e2b760906bf5ff22398160b113f18792 --- /dev/null +++ b/full_models/gbo/vocab.txt @@ -0,0 +1,45 @@ +ǎ +p +a + +s +w +m +ï +ä +e +d +j +ɕ +h +n +i +̀ +ü +g +y +_ +b +c +ǒ +k +t +ì +à +è +ɛ +u +' +ɔ +- +o +l +ě +ò +č +f +ù +̌ +ǔ +̈ +ǐ diff --git a/full_models/gde/D_100000.pth b/full_models/gde/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7f2a32473fc130b6923727ec90ef9c7c7cf926d --- /dev/null +++ b/full_models/gde/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61f57a6a58fd9e7dc561f06dc8e0ace0d69eaa1b101161c810d15afdaadca191 +size 561110261 diff --git a/full_models/gde/G_100000.pth b/full_models/gde/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2af15d0e521cf747d7bb0b092c1f90c8e3e73100 --- /dev/null +++ b/full_models/gde/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c296cab64b6abfce43606553ef2984ddd2b72994adfdc7e9a92e3b54962a54 +size 436616917 diff --git a/full_models/gde/config.json b/full_models/gde/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gde/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gde/vocab.txt b/full_models/gde/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f580ea1a150d486e017f0150be3200c9c5ab9320 --- /dev/null +++ b/full_models/gde/vocab.txt @@ -0,0 +1,38 @@ +| +a +ə +i +n +k +t +u +m +s +g +d +ŋ +y +h +o +c +w +' +l +e +r +p +b +ɗ +j +z +f +v +ɓ +- +1 +2 +8 +5 +4 +7 + diff --git a/full_models/geb/D_100000.pth b/full_models/geb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4786401e8ee52d3f0ebe7402a51a7acc01605dda --- /dev/null +++ b/full_models/geb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d443cc77fe3ce3419d643a6492a4ed860d6398eb90034b9ba400e837c996eea9 +size 561106269 diff --git a/full_models/geb/G_100000.pth b/full_models/geb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..272d4df5970e8ac251cb6e013b9f4e83306cef3e --- /dev/null +++ b/full_models/geb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433a9c53110d0121c5c97ed24f54cca865f9b56c0c9c9ae96f3df29fe6be0886 +size 436577590 diff --git a/full_models/geb/config.json b/full_models/geb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/geb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/geb/vocab.txt b/full_models/geb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e7815670a32ab40a64827db9d7854f206a03a24c --- /dev/null +++ b/full_models/geb/vocab.txt @@ -0,0 +1,34 @@ +| +a +i +n +g +m +u +r +e +h +b +à +k +v +ç +z +t +d +s +p +o +f +w +å +0 +1 +' +2 +5 +3 +4 +9 +8 + diff --git a/full_models/gej/D_100000.pth b/full_models/gej/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9a5d93355322a2d1fba0c50c03eca8055bc69de --- /dev/null +++ b/full_models/gej/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122c0167dd0a3fd1a0873915b9b457c95732357e675767d5e0c62b14ba0a0c8c +size 561110117 diff --git a/full_models/gej/G_100000.pth b/full_models/gej/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39f6cc63a431ac45e734a1c4edd95660deda818b --- /dev/null +++ b/full_models/gej/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0e9a8f21281a251d9be8bf8e2bf566a6cc7f6344abe94d367a90641cf9cc74 +size 436633915 diff --git a/full_models/gej/config.json b/full_models/gej/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gej/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gej/vocab.txt b/full_models/gej/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..765b7333d011cc3933b42da809e8abfccb2e6919 --- /dev/null +++ b/full_models/gej/vocab.txt @@ -0,0 +1,45 @@ +| +a +e +o +è +ɔ +n +m +̀ +u +k +ɛ +b +w +i +l +à +y +- +t +s +ɖ +g +̃ +ì +j +ù +ò +ŋ +v +d +p +ã +f +r +h +x +z +c +ũ +đ +ĩ +ƒ +í + diff --git a/full_models/gil/D_100000.pth b/full_models/gil/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..483c6a30ba1152c11ef2e2cd079cdc8c6d31bb02 --- /dev/null +++ b/full_models/gil/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e9f683ce2dcdb6b693a20e24060b6fac5dcd17ef5e3f520cea04d7c23ea7d9 +size 561078754 diff --git a/full_models/gil/G_100000.pth b/full_models/gil/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b03ef02fa0cd886a11f08b766f16f447eb2f6ad --- /dev/null +++ b/full_models/gil/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166eb9ece9a2c031928265b70629788b9ee8e008f50d43d5b418bda11997ad1c +size 436355288 diff --git a/full_models/gil/config.json b/full_models/gil/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gil/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gil/vocab.txt b/full_models/gil/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..79c361131a1ce7bc8ab75b0173818e14a9d79f41 --- /dev/null +++ b/full_models/gil/vocab.txt @@ -0,0 +1,27 @@ +5 +1 +b +2 +p +t +w +u +7 +0 +a +k +q +g +s +r +- +4 +n +m + +o +_ +' +e +3 +i diff --git a/full_models/gjn/D_100000.pth b/full_models/gjn/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..39a55d9f84a18dbc871419f7a632f2b7773a88dd --- /dev/null +++ b/full_models/gjn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67102a12f76037db79fe059b8c5c2e950475e0346fa7ceb688d870483643fb79 +size 561078099 diff --git a/full_models/gjn/G_100000.pth b/full_models/gjn/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9ea6563e3492bb3a80d0877c3bb47e1c2cf36ed --- /dev/null +++ b/full_models/gjn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:290df094d5145f7e68c35a6492150a3dce246b3a8f492d52530ba622db5b8af4 +size 436359159 diff --git a/full_models/gjn/config.json b/full_models/gjn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gjn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gjn/vocab.txt b/full_models/gjn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d605491c9e29a44eb701338b655a379d2562b7b0 --- /dev/null +++ b/full_models/gjn/vocab.txt @@ -0,0 +1,31 @@ +| +a +n +e +b +ɛ +k +o +m +i +s +ŋ +u +l +r +ɔ +t +y +h +p +d +w +f +g +j +c +z +v +' +- + diff --git a/full_models/gkn/D_100000.pth b/full_models/gkn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..590b6a2e944633dcde9ce66d63f5d2e4ced9de51 --- /dev/null +++ b/full_models/gkn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a769fc0ab9bfc650b8991c8344fdd3b5b9ba7848b47c58ee9f5a843df77c71e0 +size 561110124 diff --git a/full_models/gkn/G_100000.pth b/full_models/gkn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9be3f81ef14d0f698394681a63e8f3e7517af65f --- /dev/null +++ b/full_models/gkn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccc31cbd3f96ee1d33e29124d8dba2e8a7438cd34819cf22a3ec3d409fe06bb +size 436654695 diff --git a/full_models/gkn/config.json b/full_models/gkn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gkn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gkn/vocab.txt b/full_models/gkn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0a597aaf7abdef0881b8839240d25f99c04eb36d --- /dev/null +++ b/full_models/gkn/vocab.txt @@ -0,0 +1,55 @@ +| +b +e +n +a +l +á +à +k +g +ọ +è +o +ó +é +m +í +d +t +i +ò +̀ +ẹ +v +ì +́ +s +p +ú +u +r +y +z +õ +ã +ù +ẽ +ĩ +ṍ +j +f +̄ +̃ +ń +ʽ +ḿ +h +- +ṹ +' +ũ +ʻ +ǹ +ỳ + diff --git a/full_models/gld/D_100000.pth b/full_models/gld/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9ce6376fe9a0da792dc6560c3c9d3fabcd96c3f4 --- /dev/null +++ b/full_models/gld/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d70df9ec3160359dbb414f8f4b5ba5a0d9090f55d3b38d5e12294da9162718 +size 561076020 diff --git a/full_models/gld/G_100000.pth b/full_models/gld/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f91be88fa16a9f284f7c3abe5dda5fc84b1b85a3 --- /dev/null +++ b/full_models/gld/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94212dd7c09fb399877b10459146a7cfc3d271002b56c89713e65755b4f6a2ae +size 436349881 diff --git a/full_models/gld/config.json b/full_models/gld/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gld/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gld/vocab.txt b/full_models/gld/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f59709e48ae8086c075fea32ed0b478c1e07c865 --- /dev/null +++ b/full_models/gld/vocab.txt @@ -0,0 +1,34 @@ +| +и +а +э +н +д +у +с +о +м +ч +л +б +р +т +й +г +х +к +в +ӈ +ё +п +- +я +е +ю +ф +– +з +ь +' +ц + diff --git a/full_models/glk/D_100000.pth b/full_models/glk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fefa02a2ec51fa0daaa94acaa77daa9a16610d38 --- /dev/null +++ b/full_models/glk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b04bc7750459eedd9fa38ab79d2444249ae599f63559ebcb390b66f5127ff1 +size 561076186 diff --git a/full_models/glk/G_100000.pth b/full_models/glk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e362aa32c3b228bfd45850532278492f6e5a1ee0 --- /dev/null +++ b/full_models/glk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78d25da6a6f79f4bdb0d26996f22e5cb6229eebf826fd777741f2df0bd0cb55 +size 436362665 diff --git a/full_models/glk/config.json b/full_models/glk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/glk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/glk/vocab.txt b/full_models/glk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbdb33bb48c35b7cadeba9378e4bacf5e710e64c --- /dev/null +++ b/full_models/glk/vocab.txt @@ -0,0 +1,39 @@ +ٚ +م +س +_ +ص +ؤ +د +ز +غ + +گ +پ +ئ +ظ +ث +و +ذ +ق +آ +ا +خ +ت +ب +ک +ج +ش +ع +ل +ض +ط +- +چ +أ +ه +ر +ف +ح +ن +ی diff --git a/full_models/gmv/D_100000.pth b/full_models/gmv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..29f0fcbb86d99ca1efdccd9ae5c01580568fb81f --- /dev/null +++ b/full_models/gmv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa5bbb629ffe72a0fe671b4963b4b6734c301366bf3c10ba97362538805f6f1 +size 561110004 diff --git a/full_models/gmv/G_100000.pth b/full_models/gmv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8f29aeb9877619aa47ed8dbfbdb9f27068a0b376 --- /dev/null +++ b/full_models/gmv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4daf0567575d53a2ef27882e852228f73467985f4d1cf48ffbf544946668344a +size 436599085 diff --git a/full_models/gmv/config.json b/full_models/gmv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gmv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gmv/vocab.txt b/full_models/gmv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..db5db51bbca217466cc3bbb9e58e3ce4887ee2ed --- /dev/null +++ b/full_models/gmv/vocab.txt @@ -0,0 +1,31 @@ +a +| +i +s +e +t +o +n +d +h +y +k +g +m +l +u +z +r +b +p +q +w +x +c +f +7 +j +- +2 +1 + diff --git a/full_models/gna/D_100000.pth b/full_models/gna/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f82d18aeb8f34a1cd4f071cc0c3d3dafc9021dbc --- /dev/null +++ b/full_models/gna/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:324ed04b66bc38e7a7a8306b2d9e28d6c21350685ab094526e9fd3263674c441 +size 561078617 diff --git a/full_models/gna/G_100000.pth b/full_models/gna/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe05a153f17f20d262b2dae10b51de6ea7507e59 --- /dev/null +++ b/full_models/gna/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da69a62a666c66a4724efcdad878bc46d7b88bdcc1c272cfc24552b9ac0ac09a +size 436426689 diff --git a/full_models/gna/config.json b/full_models/gna/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gna/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gna/vocab.txt b/full_models/gna/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e229eaf9d83b1b00d319542fbae040f8adf8f7a7 --- /dev/null +++ b/full_models/gna/vocab.txt @@ -0,0 +1,59 @@ +l +ó +z +ŋ +ɩ +ĩ +n + +õ +j +f +i +v +á +b +ʋ +k +– +ě +u +́ +û +r +ɔ +g +ɛ +̌ +̂ +e +ǎ +é +ô +h +̃ +c +ǐ +w +í +a +î +m +_ +ṹ +o +s +ũ +ú +- +â +ǒ +y +d +ê +ṍ +ɲ +ã +p +t +' diff --git a/full_models/gnd/D_100000.pth b/full_models/gnd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..45168787683c13c6390b63634a913cbb956d7972 --- /dev/null +++ b/full_models/gnd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9187359c1ef944da883255035059c2d562a0c5f541a6e4d33ee6659aa6d089e +size 561109109 diff --git a/full_models/gnd/G_100000.pth b/full_models/gnd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e5b1c1a1d817e4e03ba4864458f28a07e6abf56d --- /dev/null +++ b/full_models/gnd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7040139dc33cf21d0183d29b84b3af4757e9a030a252bef9ff9dd301d96c82 +size 436606523 diff --git a/full_models/gnd/config.json b/full_models/gnd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gnd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gnd/vocab.txt b/full_models/gnd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..87c47bdc15179998baeee9a079d2f4713f849fdf --- /dev/null +++ b/full_models/gnd/vocab.txt @@ -0,0 +1,35 @@ +| +a +m +k +à +t +e +r +i +ə +g +u +l +s +d +n +b +w +y +ŋ +z +̀ +ɗ +ì +h +è +v +f +p +ù +ɓ +' +o +ɂ + diff --git a/full_models/gng/D_100000.pth b/full_models/gng/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b400831c63025809017c99d9e5b2052ad4e8e4e --- /dev/null +++ b/full_models/gng/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a87f0cd8eea7cb889867e34fe48b2f2cb31161e2d364cbdfd96dd7a501cc359 +size 561078752 diff --git a/full_models/gng/G_100000.pth b/full_models/gng/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4b2ee0778086001b2e82da1ec7b982c109e69524 --- /dev/null +++ b/full_models/gng/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8ec5fdd10528243286ccaf6f30d5de326fe2b3f2c9d27bbc5bf31a48172cd4 +size 436396369 diff --git a/full_models/gng/config.json b/full_models/gng/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gng/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gng/vocab.txt b/full_models/gng/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b27c88a73d35b2c13a7e77d775d9df07ef425f73 --- /dev/null +++ b/full_models/gng/vocab.txt @@ -0,0 +1,44 @@ +| +n +i +a +b +ɛ +e +k +u +ɔ +t +l +y +m +o +' +w +r +s +d +h +à +ʼ +p +í +j +g +ŋ +c +f +ń +ì +ñ +̀ +é +ù +è +ó +á +- +́ +ò +ú + diff --git a/full_models/gof-script_latin/D_100000.pth b/full_models/gof-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dc1e0c794c5fc1fd12745fb216db2fc3ff45ef00 --- /dev/null +++ b/full_models/gof-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef9455c0fc72faea8f90d54736ce4813ffa7bb5166a640d2861ccbc7b311ca8f +size 561078765 diff --git a/full_models/gof-script_latin/G_100000.pth b/full_models/gof-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9bdedcc7896837b5b0a1d3a2a25e3d40f85406e4 --- /dev/null +++ b/full_models/gof-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cf78c939d588893c2867aff2b1d6b3caee86ea9deda47414226925bd7b6b318 +size 436360622 diff --git a/full_models/gof-script_latin/config.json b/full_models/gof-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gof-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gof-script_latin/vocab.txt b/full_models/gof-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4583adbe868976cae5f99e08469291ab17014092 --- /dev/null +++ b/full_models/gof-script_latin/vocab.txt @@ -0,0 +1,29 @@ +a +| +i +s +e +n +o +t +h +y +d +k +u +g +m +b +l +r +w +7 +p +q +x +c +f +z +j +- + diff --git a/full_models/gog/D_100000.pth b/full_models/gog/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cdcf9feda0a2fd000d12e29cd038dc4cc125cecf --- /dev/null +++ b/full_models/gog/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8f3271bbfe0c659429156dd0bb6c1faa13e799f458173277eeb573a70bf010 +size 561109986 diff --git a/full_models/gog/G_100000.pth b/full_models/gog/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68404f7654466a10f5e89421b9c62eba06881a88 --- /dev/null +++ b/full_models/gog/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32d0ab8071576be8d538cb97e2474d98344d47bcdb2f948189166503d6acc923 +size 436591669 diff --git a/full_models/gog/config.json b/full_models/gog/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gog/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gog/vocab.txt b/full_models/gog/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a11f9b15530e428d5359aacef0cf176ed236f2e3 --- /dev/null +++ b/full_models/gog/vocab.txt @@ -0,0 +1,27 @@ +| +a +u +i +n +o +w +e +l +m +y +k +h +g +z +s +t +c +b +v +j +d +p +' +f +- + diff --git a/full_models/gor/D_100000.pth b/full_models/gor/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82f2c3555e89e238b5666575e339673efdef7e3a --- /dev/null +++ b/full_models/gor/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bcce6d8bc15bf53929b4d28112f4dac8f2bcdf1db4279a99687b13f09d62a2 +size 561109866 diff --git a/full_models/gor/G_100000.pth b/full_models/gor/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b546b6088e88bbc41199c8b27c585525990aaba3 --- /dev/null +++ b/full_models/gor/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff9f5a5208e28efe92a5c6fd4337606e011b399ede1680123aaf6a88e291226 +size 436588478 diff --git a/full_models/gor/config.json b/full_models/gor/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gor/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gor/vocab.txt b/full_models/gor/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8036a1b204bb328f37c52426d30b3e64bdce2ac3 --- /dev/null +++ b/full_models/gor/vocab.txt @@ -0,0 +1,27 @@ +| +o +a +l +i +u +t +m +w +n +y +e +g +h +d +b +p +s +' +r +k +- +j +c +z +f + diff --git a/full_models/gqr/D_100000.pth b/full_models/gqr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39a5ffa7877f9fc46d82ab7195665b199267e009 --- /dev/null +++ b/full_models/gqr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def396c656adfcc638065292c1f30a5b867ef7e52f30800e525fe1c5e01b79f4 +size 561079011 diff --git a/full_models/gqr/G_100000.pth b/full_models/gqr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b7c0acf63b728cc2c9df9496ed0161c8a31ce37 --- /dev/null +++ b/full_models/gqr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11b27448ba462744a33ddceac5834d1ac8b44cc6512c4cf3ca8539b14dcd5cb0 +size 436361725 diff --git a/full_models/gqr/config.json b/full_models/gqr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gqr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gqr/vocab.txt b/full_models/gqr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aef5a81d31a84b6e3dc31376742ef36d250a294e --- /dev/null +++ b/full_models/gqr/vocab.txt @@ -0,0 +1,29 @@ +e +h + +ɨ +k +' +p +r +u +ɓ +j +ɔ +i +o +- +n +a +w +ɗ +s +g +_ +d +t +l +m +b +y +ə diff --git a/full_models/grc/D_100000.pth b/full_models/grc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3a42977aee708cc511e2bf6c5926e05d8982d95 --- /dev/null +++ b/full_models/grc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4722d136586a1fefc49b10c50c4b7bba5a77f9752fe8802880847cd166050570 +size 561079501 diff --git a/full_models/grc/G_100000.pth b/full_models/grc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c8c0ceb47a237948a92d892a6c4f09d4d5d3c58a --- /dev/null +++ b/full_models/grc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc74fe5ad36a8b13f90a68026b555c1ecf68c2bb59eb73762d87bfbb6bd2b665 +size 436571736 diff --git a/full_models/grc/config.json b/full_models/grc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/grc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/grc/vocab.txt b/full_models/grc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f0ae19e6f1f18b5da8109794d14f778b25ccb5f8 --- /dev/null +++ b/full_models/grc/vocab.txt @@ -0,0 +1,119 @@ +ἤ +ὡ +ρ +ὗ +ᾧ +ψ +ἶ +ἄ +ὢ +θ +ὑ +– +ά +ῇ +π +έ +ἢ +ᾠ +ᾅ +η +γ +- +ξ +ς +κ +ὒ +μ +ΰ +ὓ +ὠ +ὼ + +ἔ +ὸ +ὶ +ὄ +ᾶ +ΐ +ᾳ +λ +υ +ἁ +ὔ +ὅ +τ +ἧ +β +ἓ +ἆ +ᾗ +ᾑ +ῆ +ἱ +ἐ +ἀ +χ +σ +ἅ +ᾄ +ἦ +ἑ +ἷ +ῒ +ῄ +ῳ +ῖ +ῷ +ὁ +ῥ +φ +ή +ὰ +ύ +ζ +ὧ +ὤ +ἂ +ο +ἣ +ἰ +ὖ +' +ῶ +ό +ἳ +ἕ +ἠ +δ +ἃ +ῴ +ί +ι +ἡ +ὐ +ϋ +ὀ +ε +ὃ +ᾖ +ν +ὥ +ῦ +α +ϊ +ᾔ +ὴ +ω +ἵ +ᾐ +ἴ +ὕ +ἥ +ὲ +ὦ +ώ +ᾷ +ῃ +ὺ +_ diff --git a/full_models/gri/D_100000.pth b/full_models/gri/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..907ca525b2f0f32875e91f7b2aff2892b03473d9 --- /dev/null +++ b/full_models/gri/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690cf81f5d5b67a3344cc4b33b71d7d26bb7af8d68eadf958f9b1e8634f21f82 +size 561078757 diff --git a/full_models/gri/G_100000.pth b/full_models/gri/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f88ac042d99827a293254978d75287c5fda2b9ad --- /dev/null +++ b/full_models/gri/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f377f2895dc75ca799dcec5fcef03b217c33b646351618d0b8e3404a6d1a4a09 +size 436361086 diff --git a/full_models/gri/config.json b/full_models/gri/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gri/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gri/vocab.txt b/full_models/gri/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b06a2dce38f45ccae938b583d5a6f613537ababc --- /dev/null +++ b/full_models/gri/vocab.txt @@ -0,0 +1,30 @@ +i +a +_ +6 +k +– +r +u +p +l +s +t +1 +m +b +d +e +v +g +j +h +n +o +4 +2 +- +' +q + +0 diff --git a/full_models/grn/D_100000.pth b/full_models/grn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83ed57c445ae56a541588e2155cb17bcf11b3117 --- /dev/null +++ b/full_models/grn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cddbae0b20fc64b4f52179acbc5c5899c5e869b11f1ae57f7d469686b4fc0d62 +size 561079084 diff --git a/full_models/grn/G_100000.pth b/full_models/grn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ba75cefc3a581c421f745c35a1833d0b2a1c00b4 --- /dev/null +++ b/full_models/grn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc61527119b01d174f675bf5a31ab9221be138c1a6b1b9d782ef7e8182ec2ad2 +size 436416104 diff --git a/full_models/grn/config.json b/full_models/grn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/grn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/grn/vocab.txt b/full_models/grn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3e48853adc1b87cc02d5fb122a63bfd23d3d8df6 --- /dev/null +++ b/full_models/grn/vocab.txt @@ -0,0 +1,53 @@ +3 +ñ +m +l +ỹ +ũ +h +k +6 +8 +a + +ẽ +v +ý +d +7 +p +n +q +ã +4 +b +1 +0 +ú +9 +f +— +c +j +y +ó +í +é +_ +r +- +e +u +t +5 +2 +i +á +g +' +z +õ +ĩ +o +x +s diff --git a/full_models/grt/D_100000.pth b/full_models/grt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81f8b75b19ce4317b55270968c851a52bb03a30d --- /dev/null +++ b/full_models/grt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d77b92c50601f8ee9955cb6adc65a3b6912cd483f3e22be5e799092e9face86 +size 561109722 diff --git a/full_models/grt/G_100000.pth b/full_models/grt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a7a512d962d4d5b200b41a1663317e89711be77 --- /dev/null +++ b/full_models/grt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604cce8abca554a0fd2dacbd69ac69faf7a1e719a420b5a2b49648095817775b +size 436671286 diff --git a/full_models/grt/config.json b/full_models/grt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/grt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/grt/vocab.txt b/full_models/grt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..898b1f7d796e1879a3e6c14aed46b4162a833065 --- /dev/null +++ b/full_models/grt/vocab.txt @@ -0,0 +1,63 @@ +| +া +ি +ন +ং +্ +ক +ম +ব +র +স +ো +আ +খ +গ +দ +ে +জ +য +় +ল +চ +ত +ু +ই +হ +ও +থ +প +উ +ফ +ী +এ +ৎ +শ +ষ +ট +ূ +অ +- +ৌ +ড +' +ণ +ছ +ধ +ৈ +ঠ +ঘ +ঃ +ভ +ঝ +ঐ +ঙ +ঊ +1 +ঈ +ঁ +s +l +d +a + diff --git a/full_models/gso/D_100000.pth b/full_models/gso/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1c8998bb9eaeddafb5f99844e96cdaa4c63316b5 --- /dev/null +++ b/full_models/gso/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbefb9ef6c955a4aeb3c45fabb765da60eb9b6ac801d978a2b6bd1148ea34bac +size 561110394 diff --git a/full_models/gso/G_100000.pth b/full_models/gso/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed6924d1086f33ad79ea305ae3cdbbf593fb013a --- /dev/null +++ b/full_models/gso/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034bb5291045b92ede04e0e64792a6602b0dba25cecfc9a605d493dd116a1075 +size 436613900 diff --git a/full_models/gso/config.json b/full_models/gso/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gso/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gso/vocab.txt b/full_models/gso/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4e32dda1055e6e29a5516e5231098a708971277 --- /dev/null +++ b/full_models/gso/vocab.txt @@ -0,0 +1,36 @@ +| +a +n +ɛ +i +m +ɔ +g +e +h +k +o +w +s +b +t +d +u +l +p +z +y +r +f +- +̂ +j +é +c +ï +v +q +x +è +ë + diff --git a/full_models/gub/D_100000.pth b/full_models/gub/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b214a7a4c2f280f18dad8824f56ab0db28ba0d1 --- /dev/null +++ b/full_models/gub/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa1570f411207c7cafe38e7452a2448e1200cf4e64619bb39e59dcfa5f5a75ab +size 561078612 diff --git a/full_models/gub/G_100000.pth b/full_models/gub/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fbc5451c60c1a13bf9ee635d9dea533065c122dc --- /dev/null +++ b/full_models/gub/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579c2415cf1f36bb509c15981440677750fd9c40d6e490a754d4ae1db346ec32 +size 436364335 diff --git a/full_models/gub/config.json b/full_models/gub/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gub/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gub/vocab.txt b/full_models/gub/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1f854ffec80612affef65fb53ffd705450852aef --- /dev/null +++ b/full_models/gub/vocab.txt @@ -0,0 +1,32 @@ +à +8 +4 +t +- +k +p +u +1 +0 +x +i +z +3 +_ +a +e +m +' +6 +n +5 +w +g +r +h +o +7 + +9 +2 +y diff --git a/full_models/guc/D_100000.pth b/full_models/guc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..17236f5ec8bf2e4ecaf16c4d909b87f0c2496eb3 --- /dev/null +++ b/full_models/guc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18378319eb3fa331717e8c0859f29f96a5f6bd7c17eab6221619b641ed107a4 +size 561106384 diff --git a/full_models/guc/G_100000.pth b/full_models/guc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f67aa766a1287c139ae1975b9a5086aa7b129095 --- /dev/null +++ b/full_models/guc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19358a57932736d36fb15122425bacbfca892aacc1bafb5c95e949ff3742c8ab +size 436603398 diff --git a/full_models/guc/config.json b/full_models/guc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guc/vocab.txt b/full_models/guc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..543e09376464ee58e1e5a90a286ea22a362b3dfa --- /dev/null +++ b/full_models/guc/vocab.txt @@ -0,0 +1,45 @@ +a +| +n +i +ü +e +s +t +k +u +j +l +m +' +o +h +w +p +y +r +c +d +ú +— +b +í +é +g +f +á +ó +0 +v +z +q +1 +2 +x +5 +4 +ñ +3 +6 +7 + diff --git a/full_models/gud/D_100000.pth b/full_models/gud/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8be722c12aa0606a775279a216c8c739d380a0aa --- /dev/null +++ b/full_models/gud/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e1b94f65f93dd2c6e5ff5a8faf81e1eb68d40b59cb8234435aa4780aa8e83e +size 561078625 diff --git a/full_models/gud/G_100000.pth b/full_models/gud/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b239c94b07fbc29ed8757f8db8af9821a07973e --- /dev/null +++ b/full_models/gud/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1311e8170d5995acccd36b14f1df1c4dd130152bb232aed0a729f1f30257e347 +size 436366680 diff --git a/full_models/gud/config.json b/full_models/gud/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gud/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gud/vocab.txt b/full_models/gud/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e3641fca4d983ae3467c204c94ab93b39929430a --- /dev/null +++ b/full_models/gud/vocab.txt @@ -0,0 +1,33 @@ +| +a +l +n +ɩ +' +ɔ +‐ +y +ɛ +k +ʋ +i +b +m +e +t +g +c +o +h +p +s +u +w +z +d +f +ŋ +j +v +0 + diff --git a/full_models/guh/D_100000.pth b/full_models/guh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b4cbca5ce18384a1eb5f78ec94f56d1f2b15a7a6 --- /dev/null +++ b/full_models/guh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84aedfa8380c369f1b1208a143c22a88d2b16dbf134f63479f40b328a68a2f7 +size 561076195 diff --git a/full_models/guh/G_100000.pth b/full_models/guh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3a02d3bfa3e519bf084ca6f9aca74a858193aba6 --- /dev/null +++ b/full_models/guh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fd273ae933f490426134e5ce7abf8c375c251877a480e64da71feab7186862 +size 436376356 diff --git a/full_models/guh/config.json b/full_models/guh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guh/vocab.txt b/full_models/guh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d435da392f4b5e83b8cd6b9bd8314f4e24fb51a8 --- /dev/null +++ b/full_models/guh/vocab.txt @@ -0,0 +1,45 @@ +j +4 +s +y +ó +í +d +_ +- +— + +l +z +' +b +á +h +r +̱ +v +u +m +ë +g +ñ +ú +7 +q +o +­ +t +i +ĩ +õ +c +a +é +n +f +e +w +p +k +x +ã diff --git a/full_models/guj/D_100000.pth b/full_models/guj/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc7868491443b5289fcd4d61f6b8cb150ef98014 --- /dev/null +++ b/full_models/guj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528ab77fc373c8b31a73f717d5531f24e0eb26c9c18c9f57861e4acf131b1ba3 +size 561079356 diff --git a/full_models/guj/G_100000.pth b/full_models/guj/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c521ea624c587e293e0f4b1178c80bdb5e55686 --- /dev/null +++ b/full_models/guj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3af7925d0672cb81c525beb65563161fc3895a3849ecee9888559f9500849dd +size 436435387 diff --git a/full_models/guj/config.json b/full_models/guj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guj/vocab.txt b/full_models/guj/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..af5307892fbac94cc8c58520d36d960662c63003 --- /dev/null +++ b/full_models/guj/vocab.txt @@ -0,0 +1,60 @@ +| +ા +ે +ત +ન +ર +્ +મ +ી +ક +ં +ો +પ +વ +ુ +સ +ય +હ +જ +થ +િ +શ +ણ +છ +લ +દ +આ +ઓ +અ +એ +ઈ +બ +ગ +ખ +ધ +ભ +ટ +ળ +ૂ +ચ +ડ +ષ +ઉ +ફ +ઘ +ઠ +ૃ +' +ઊ +ઇ +ઞ +ઝ +ઢ +ૈ +ઃ +ૌ +- +ઋ +ઐ + diff --git a/full_models/guk/D_100000.pth b/full_models/guk/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..03a652cae2c8e5fdc7be3eaacb8fa0690ed3b45d --- /dev/null +++ b/full_models/guk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbad99f1ce710057bc470004c98d9f97af9842b21a7d9bb80fcfab2d4195d5d2 +size 561078847 diff --git a/full_models/guk/G_100000.pth b/full_models/guk/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..e81c3d02acf943274a69d58ecb303a3a749a0e22 --- /dev/null +++ b/full_models/guk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c5a350565be6554985d64d813a08fde98af9100ae478504b95c0f231841edd +size 436358911 diff --git a/full_models/guk/config.json b/full_models/guk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..993d1dedb1d0c8e820b98f9e2f019ff166327038 --- /dev/null +++ b/full_models/guk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.uroman", + "validation_files": "dev.uroman", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guk/vocab.txt b/full_models/guk/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..09c467a4acb08779bb0152c2c415e9333fb653c4 --- /dev/null +++ b/full_models/guk/vocab.txt @@ -0,0 +1,28 @@ + +' +- +a +b +c +d +e +f +g +h +i +j +k +l +m +n +o +p +q +r +s +t +u +w +x +y +z diff --git a/full_models/gum/D_100000.pth b/full_models/gum/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ad4cfda49af1bf8a0ea00c6bfcdbdd1308bc7bf --- /dev/null +++ b/full_models/gum/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0755e583b0b39fe2cc3cf7dfd5c4c9d184de3c83bf562281c7fa23a272bcf9d2 +size 561109839 diff --git a/full_models/gum/G_100000.pth b/full_models/gum/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ca2b734f01e3d1daf9ecf7fddd8199c6d0c32997 --- /dev/null +++ b/full_models/gum/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea406973d9699d994463477d4adfeada83625459e1fa606b7cc7e0593f4c31c2 +size 436625202 diff --git a/full_models/gum/config.json b/full_models/gum/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gum/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gum/vocab.txt b/full_models/gum/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5d1190b68dc95ca6f0d3fe7b80e92d7d866369df --- /dev/null +++ b/full_models/gum/vocab.txt @@ -0,0 +1,43 @@ +| +a +i +r +n +e +ø +u +g +m +b +t +s +k +h +c +l +w +p +y +d +o +ñ +ú +j +— +í +z +é +á +' +f +v +- +ó +q +0 +x +1 +2 +4 +3 + diff --git a/full_models/guo/D_100000.pth b/full_models/guo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ca4f1da60e7100a3721b419da1dd01cdb40f4830 --- /dev/null +++ b/full_models/guo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb8c6d8659d41432676c462bef8db5524c8ca4b509147be8e6672061611d268 +size 561109584 diff --git a/full_models/guo/G_100000.pth b/full_models/guo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1ffdcc72e5dcb7f3ae1b43f58e589e5685707b40 --- /dev/null +++ b/full_models/guo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0d2902f625a0643c219c47d0cc9cb74017088960d42408bce36c8449c6894f +size 436613430 diff --git a/full_models/guo/config.json b/full_models/guo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guo/vocab.txt b/full_models/guo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d562c9c2b43ed0d90ef20e60c88b1cdc8e7f6b8 --- /dev/null +++ b/full_models/guo/vocab.txt @@ -0,0 +1,38 @@ +a +| +e +j +i +n +t +l +o +x +s +w +p +m +ʉ +c +h +k +b +d +- +u +r +f +' +y +ú +— +í +g +é +á +v +ó +z +q +ñ + diff --git a/full_models/guq/D_100000.pth b/full_models/guq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7b1582e0923058c9853557399583fe078033ad4 --- /dev/null +++ b/full_models/guq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597723a03782d4ae4fb5848be50939fc5c4d3aac611d21b3b1d0aa78b4dcaefc +size 561078988 diff --git a/full_models/guq/G_100000.pth b/full_models/guq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f0acdf868eee379af17310941424067967fc1e8f --- /dev/null +++ b/full_models/guq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337005b1db915ee9c7cbdb14ace72f6ee12c8d3acedf874ecfdc38be1995b42e +size 436399337 diff --git a/full_models/guq/config.json b/full_models/guq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guq/vocab.txt b/full_models/guq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7bf01d157b12272d04b0e43c215aad24557799de --- /dev/null +++ b/full_models/guq/vocab.txt @@ -0,0 +1,46 @@ +g +0 +l +u +e +o +i +ẽ +s +_ +j +m +f +­ +k +á +ó +í +x +a +— +b +z + +' +c +é +̃ +d +q +– +ũ +ñ +n +1 +5 +h +õ +w +ã +r +t +y +p +ĩ +2 diff --git a/full_models/guu/D_100000.pth b/full_models/guu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..50501b0692af6656fd1adb08624523fc5e8df37e --- /dev/null +++ b/full_models/guu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42874e915713037a4f31e22412cf4a039970d05ad69b74e07635cbcb0acc696 +size 561078473 diff --git a/full_models/guu/G_100000.pth b/full_models/guu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23eb5f93b1817377d28b3a3a7fa0cc58ad7e6cf4 --- /dev/null +++ b/full_models/guu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed05d376bb27436aa81353b13f6b9be7e6887a2a1c5cd5771d231640da95ba5 +size 436396619 diff --git a/full_models/guu/config.json b/full_models/guu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/guu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/guu/vocab.txt b/full_models/guu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d463b75101a3ab09bf585723eb4af0abfeec0481 --- /dev/null +++ b/full_models/guu/vocab.txt @@ -0,0 +1,46 @@ +' +r +8 +ä +̦ +s +— +q +a +g +9 +2 +1 + +c +b +5 +7 +ó +n +y +p +í +á +ú +3 +e +4 +ö +_ +l +i +f +j +6 +t +u +0 +h +é +o +m +ñ +v +w +d diff --git a/full_models/gux/D_100000.pth b/full_models/gux/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c2fd9e729c1e0b1f0bc500bf9a78c6ef0de3c063 --- /dev/null +++ b/full_models/gux/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2157b49d8364ff525706d6a9d88cf8f5e76fffd1129eee4300587b31f3df4a +size 561110123 diff --git a/full_models/gux/G_100000.pth b/full_models/gux/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cfddd40a56b901e2d06a36a463d41dd8d2e6c727 --- /dev/null +++ b/full_models/gux/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d82fac6d98286ebae00e721a196f2f9924fa3099399ca7ddea7b2d03aa9a4a +size 436589035 diff --git a/full_models/gux/config.json b/full_models/gux/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gux/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gux/vocab.txt b/full_models/gux/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..db3767d5cc505e1a59391fadc4f3a6a654f13192 --- /dev/null +++ b/full_models/gux/vocab.txt @@ -0,0 +1,27 @@ +| +a +i +n +e +l +u +o +b +d +k +y +m +t +g +p +s +j +c +f +w +ŋ +ñ +h +- +v + diff --git a/full_models/gvc/D_100000.pth b/full_models/gvc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..295755ad67fe027787345f9cec626fa3eb8fcf32 --- /dev/null +++ b/full_models/gvc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e4bd8d8af9dc91f3af6bdfb636a691f224ac7ba646340b3a766ddfd00b8175 +size 561109593 diff --git a/full_models/gvc/G_100000.pth b/full_models/gvc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4686cdab2613d61c7511799f5ddd24bab0ede71 --- /dev/null +++ b/full_models/gvc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ce901751ba635a1760317468e3a600bd8205c14ae42ba7255521e6a2a132dc +size 436625042 diff --git a/full_models/gvc/config.json b/full_models/gvc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gvc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gvc/vocab.txt b/full_models/gvc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..81c9f7fb60a8258b018764f953be1fb64414fdc9 --- /dev/null +++ b/full_models/gvc/vocab.txt @@ -0,0 +1,43 @@ +| +a +i +r +u +o +h +e +̶ +t +n +c +m +s +j +y +p +ã +d +w +b +ñ +ũ +g +í +õ +— +l +ĩ +ó +q +f +ẽ +v +é +z +' +á +ú +k +à +x + diff --git a/full_models/gvl/D_100000.pth b/full_models/gvl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b3104f2df42b799a95e0e5f402b576980b7b62c --- /dev/null +++ b/full_models/gvl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52dc19575f4be67ef115a90066f4155b74b1bbdf6397823d16cfd96dd4091ff5 +size 561109840 diff --git a/full_models/gvl/G_100000.pth b/full_models/gvl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a0077ca512adcea679b97eaac64b9279a20d51d --- /dev/null +++ b/full_models/gvl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c917185b9c2767dee658a0b4ef5b3073203a5727f055e052c37935372e2e4b +size 436648200 diff --git a/full_models/gvl/config.json b/full_models/gvl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gvl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gvl/vocab.txt b/full_models/gvl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5892a1ccfa4ead392b6b485c208acd73ab64dc78 --- /dev/null +++ b/full_models/gvl/vocab.txt @@ -0,0 +1,53 @@ +| +e +n +a +k +i +d +t +g +o +r +u +m +l +' +è +s +j +é +b +ɔ +ɓ +- +à +w +y +á +ê +p +ò +̂ +h +– +c +ɗ +ó +ú +v +z +ĵ +q +ḿ +̀ +f +x +ŝ +ù +ĝ +š +í +́ +ń + diff --git a/full_models/gwi/D_100000.pth b/full_models/gwi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..78c1855f95a5341c87329cb3511abcb78b48dbf3 --- /dev/null +++ b/full_models/gwi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d276574717af860a043c1e22c1a9aa65fc852f1336a904ecacb042bd6d0dcd39 +size 561078611 diff --git a/full_models/gwi/G_100000.pth b/full_models/gwi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..814241bb1c1e8d2970f3cd9c3039f427dafeef64 --- /dev/null +++ b/full_models/gwi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4a74991c78f8621b537e0cbc6d6aba46a5ff5aee13188775c57d620762747a +size 436396477 diff --git a/full_models/gwi/config.json b/full_models/gwi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gwi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gwi/vocab.txt b/full_models/gwi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..70be38b62e3722d67b49fbc54cfe1a3368758602 --- /dev/null +++ b/full_models/gwi/vocab.txt @@ -0,0 +1,46 @@ +0 +4 +9 +ų +p +8 +v +2 +3 +c +j +' +a +į +ą +q +f +r +- +k +t +l +i +s +_ +g +o +u + +d +ǫ +w +ł +b +7 +n +x +y +z +m +5 +6 +1 +ę +e +h diff --git a/full_models/gwr/D_100000.pth b/full_models/gwr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b59d561748d5007e33ef7664bb747ec2f781f205 --- /dev/null +++ b/full_models/gwr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3745fe1670e8bf8e5db2bf2be1c58d0a3f40affe5c6374b1fd15c8ce7f14757 +size 561078966 diff --git a/full_models/gwr/G_100000.pth b/full_models/gwr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d4348825519978c2136f6cff732344a09b9309c1 --- /dev/null +++ b/full_models/gwr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3edf80d74ef139f33ef5c5d68b223a30221eb60ee0efd34d9898e34faca60853 +size 436382280 diff --git a/full_models/gwr/config.json b/full_models/gwr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gwr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gwr/vocab.txt b/full_models/gwr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..49422de6fee9adabf4eaba37548c9791841ea92d --- /dev/null +++ b/full_models/gwr/vocab.txt @@ -0,0 +1,39 @@ +o +f +y +5 +e +g +4 +a +k +c +n +9 +j +w +0 +z +ŋ +8 +p +m +s +_ +1 +3 +ʼ +6 + +- +u +t +7 +' +r +d +i +v +b +l +2 diff --git a/full_models/gym/D_100000.pth b/full_models/gym/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e913475148735e23745b38f84ac6b3078a8fc46e --- /dev/null +++ b/full_models/gym/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e66b6ac7bfa7a4bd1fd5fddf9d075d046efa60efcebff32034fc5c7f691ba79 +size 561106300 diff --git a/full_models/gym/G_100000.pth b/full_models/gym/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6ea1b8aef021983330cadfaad3803c7d8d213f45 --- /dev/null +++ b/full_models/gym/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a365d652ac4ee5d6fe36ec2aef5f2aedce1c57d6dea77b4232e14d37f0e24e +size 436610618 diff --git a/full_models/gym/config.json b/full_models/gym/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gym/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gym/vocab.txt b/full_models/gym/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..345cc44b3d4519670c705be36bbbfcc7c6a720a5 --- /dev/null +++ b/full_models/gym/vocab.txt @@ -0,0 +1,48 @@ +| +e +a +n +k +i +r +t +ä +b +m +w +u +o +ö +g +d +j +y +s +ü +ñ +l +p +c +é +h +í +f +ó +v +á +z +q +1 +2 +0 +ú +6 +8 +4 +5 +3 +- +9 +x +7 + diff --git a/full_models/gyr/D_100000.pth b/full_models/gyr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..852ac8d7511c1cd320054c83fe45b818a84130c2 --- /dev/null +++ b/full_models/gyr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1656e4e2152a519fd9b16b6e40f79e727db321fc5ad36d5a59bcd4f4a37893dd +size 561110481 diff --git a/full_models/gyr/G_100000.pth b/full_models/gyr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b185ef82687b326eb7d4fa742cadd5b971b452bb --- /dev/null +++ b/full_models/gyr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b881887d051fa45263aa9c02301af9b23dc1802101397eade6fbdd46a04fc4a6 +size 436632204 diff --git a/full_models/gyr/config.json b/full_models/gyr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/gyr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/gyr/vocab.txt b/full_models/gyr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6e4cbb8c1c2789701a0c061da489590ec5b5851a --- /dev/null +++ b/full_models/gyr/vocab.txt @@ -0,0 +1,44 @@ +| +e +a +o +r +i +p +s +v +u +ɨ +k +' +t +m +y +n +b +w +d +ä +g +c +ñ +h +ë +ü +j +̇ +l +ö +ú +ï +í +– +- +é +f +ó +á +z +q +x + diff --git a/full_models/had/D_100000.pth b/full_models/had/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2837a3a4d43a8ca6487e1edd198cc7138400fc85 --- /dev/null +++ b/full_models/had/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31fa9a6e13aa22588b11a54aa5219e1e312274332b302c3f418727ede11925a +size 561078990 diff --git a/full_models/had/G_100000.pth b/full_models/had/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1dd4dbb7a9d4f44e07ee561d1e2ad6da8f98f041 --- /dev/null +++ b/full_models/had/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23dab10df3a578e154569058e9c4689cd4698ae742e27a27b15ca77e0f5b8ce +size 436355271 diff --git a/full_models/had/config.json b/full_models/had/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/had/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/had/vocab.txt b/full_models/had/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..153f0678ff226c3e0c42ee0ac39c5c5d4431165a --- /dev/null +++ b/full_models/had/vocab.txt @@ -0,0 +1,27 @@ +d +r +c +s +y +b +z +a +h +l +m +i +n +k +_ +- +o +g +' +p +t +w +u + +j +e +f diff --git a/full_models/hag/D_100000.pth b/full_models/hag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c8b228751483078e451cb528f61af49eac79e31 --- /dev/null +++ b/full_models/hag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22b0f33ec10607b7e293180aa46259da8d4d9b7a2cbfe0367fcd878eade7546 +size 561109972 diff --git a/full_models/hag/G_100000.pth b/full_models/hag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..21123fc4c7a715b0fb9a0fc6eafc0df5564064d1 --- /dev/null +++ b/full_models/hag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8481c30c11f1f439565ac94bb3d0d6ffe6829527c0ca1f4a9b883f786148894c +size 436595351 diff --git a/full_models/hag/config.json b/full_models/hag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hag/vocab.txt b/full_models/hag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4dc813bb5e48df8bb21c52428610d7368471f3d7 --- /dev/null +++ b/full_models/hag/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +n +e +u +s +m +b +o +y +r +k +l +t +ŋ +d +p +g +z +w +h +j +c +f +v +q +` +- + diff --git a/full_models/hak/D_100000.pth b/full_models/hak/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..96d0cddf1fbbc80b98dc10efd51ec142dcb066c4 --- /dev/null +++ b/full_models/hak/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff0553785e3a9949fc303e7b267951eb222ff1aa54df62a2b6fcc32b38ad061 +size 561110006 diff --git a/full_models/hak/G_100000.pth b/full_models/hak/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a84cf5c08c18ab864dd81f51ef582ad4c474c03 --- /dev/null +++ b/full_models/hak/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733c29141c9eec577761099160801972e55ce94e30b2a37a504b791b3cb3fbaa +size 436626319 diff --git a/full_models/hak/config.json b/full_models/hak/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hak/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hak/vocab.txt b/full_models/hak/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5038c90bc1cfe5b1368d1f82535db95cc452fbb7 --- /dev/null +++ b/full_models/hak/vocab.txt @@ -0,0 +1,43 @@ +| +n +- +h +i +k +g +t +u +e +c +s +o +ì +a +y +l +m +â +p +ê +ó +ṳ +û +î +à +ò +̍ +á +f +v +ô +ú +ù +è +é +í +` +́ +̀ +̂ +' + diff --git a/full_models/hap/D_100000.pth b/full_models/hap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d39db0cb647ab2d56cae02f542054573e519d29a --- /dev/null +++ b/full_models/hap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269f988ecedcb531eeb41fe3edc6cad7f2719c0d1a7c56940c6ea226060635fa +size 561076189 diff --git a/full_models/hap/G_100000.pth b/full_models/hap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f67c887c17811a9c9cc7b3171135e9eef7d967c --- /dev/null +++ b/full_models/hap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017a0a1ba988c517f45c105f26b2bb341f881e2859d2902c01cf831a8de4bd87 +size 436358175 diff --git a/full_models/hap/config.json b/full_models/hap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hap/vocab.txt b/full_models/hap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..15fe5cffd95bf125421c7ee3603c974d661419fa --- /dev/null +++ b/full_models/hap/vocab.txt @@ -0,0 +1,37 @@ +' +t +h +p +2 +8 +4 +a +i +b +m +n +- +d +z + +e +9 +5 +g +c +1 +f +7 +j +u +s +r +l +o +3 +k +y +0 +6 +w +_ diff --git a/full_models/hat/D_100000.pth b/full_models/hat/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..234b8434d16fda1b50f92ae54e5d0252242b255a --- /dev/null +++ b/full_models/hat/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60cfb41f106f51284a67366db3c5fb2600e5d87504b9d2fe1482ee62b4f3a17 +size 561109872 diff --git a/full_models/hat/G_100000.pth b/full_models/hat/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b6dfdcb01c35f6e84ae67d3585bbfbf3985c52da --- /dev/null +++ b/full_models/hat/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6077f195e24a8659b1dad045f93a619f77683f5cb4be4b2d913d9e0f38fe646 +size 436599833 diff --git a/full_models/hat/config.json b/full_models/hat/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hat/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hat/vocab.txt b/full_models/hat/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c4d9fba7e16a0840691c3134b8c0a6863b29b1ec --- /dev/null +++ b/full_models/hat/vocab.txt @@ -0,0 +1,32 @@ +| +n +a +e +o +i +t +l +p +u +y +s +m +k +è +r +d +v +b +w +f +j +ò +g +z +' +h +c +— +à +- + diff --git a/full_models/hau/D_100000.pth b/full_models/hau/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5ca0ff7d21a2b71857a5b85c1027890be9d30276 --- /dev/null +++ b/full_models/hau/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a46981a912a4eefe6d9e82bca8141994274e36fe930701ea81d793b1d4a16c +size 561110345 diff --git a/full_models/hau/G_100000.pth b/full_models/hau/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8dbf68bbd84d1e1ad2847202896eea21f80948ab --- /dev/null +++ b/full_models/hau/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12ac37a83ccbfc9cf4017bdcfdd37c59098af328a387dfff786c86c58353e77 +size 436610324 diff --git a/full_models/hau/config.json b/full_models/hau/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hau/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hau/vocab.txt b/full_models/hau/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..82df4abd54f42dd3774e901047d566f7e3b353fd --- /dev/null +++ b/full_models/hau/vocab.txt @@ -0,0 +1,34 @@ +d +_ +ɗ +s +g +t +o +y +r +a +u +ā +i +ū +c +n +j +b +ɓ +l +- +6 +e +k +f +ă +' +w +h +z +m +ƙ +ˈ + diff --git a/full_models/hay/D_100000.pth b/full_models/hay/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c7bf4d8df1524980d8647ef4ccef8acf1d8821a0 --- /dev/null +++ b/full_models/hay/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c5eacc991710629c186b2ceafe577a5ccaf2db7092749fd5099c5dda064c0f +size 561110254 diff --git a/full_models/hay/G_100000.pth b/full_models/hay/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2aa291bc72ea4da0c99d8fe86f2388238d37e355 --- /dev/null +++ b/full_models/hay/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b339995b296932b9f7c4fcf6c5b2d5a0397b27d82aee1654190401c521941743 +size 436612528 diff --git a/full_models/hay/config.json b/full_models/hay/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hay/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hay/vocab.txt b/full_models/hay/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a1e714d5e97ec54c851e8b0a9bed1e5c85aec89a --- /dev/null +++ b/full_models/hay/vocab.txt @@ -0,0 +1,36 @@ +a +| +i +u +n +o +e +b +k +m +r +g +w +t +y +h +l +s +' +z +d +j +f +p +c +v +0 +1 +2 +4 +3 +5 +8 +6 +7 + diff --git a/full_models/heb/D_100000.pth b/full_models/heb/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..8c1f4c82ad9fe585c45a9be663a4e741f3b1d7c1 --- /dev/null +++ b/full_models/heb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e84cd15eb75c7a9033be6d9f2ed56d27b715112ab3098f1f2efb20f634a42c03 +size 561079016 diff --git a/full_models/heb/G_100000.pth b/full_models/heb/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f173cea8e4830b31ddf0c650eb6d043a69da7ef7 --- /dev/null +++ b/full_models/heb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced629c3214c15f3d4c09f4464db280c4f0ae4ad10e0708d6664efc760fc8255 +size 436368160 diff --git a/full_models/heb/config.json b/full_models/heb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/heb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/heb/vocab.txt b/full_models/heb/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..d96bb64a23b1fb113d4604078873207dab3787d2 --- /dev/null +++ b/full_models/heb/vocab.txt @@ -0,0 +1,32 @@ +| +ו +י +א +ה +ל +ת +ש +ב +ם +ר +מ +נ +כ +ע +ד +ח +ק +ן +פ +ג +ס +צ +ז +ך +ט +ף +ץ +— +' +- + diff --git a/full_models/heh/D_100000.pth b/full_models/heh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..18b41c8d6fd9f93dc8200829483747375a46f778 --- /dev/null +++ b/full_models/heh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005c5cd906a39d5eb98fb2ae91e30531f710b4eb103fc125ee144480cec6a58a +size 561110116 diff --git a/full_models/heh/G_100000.pth b/full_models/heh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1ffbcd3f43120e989167a349826aa89e5da0228 --- /dev/null +++ b/full_models/heh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb9625772739fc3c9853633f30a8ea0a76dbf87352ad68dfdfbd94be9185d65d +size 436591662 diff --git a/full_models/heh/config.json b/full_models/heh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/heh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/heh/vocab.txt b/full_models/heh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7d1a31a1c5d79dc6458965c662cf8e8358281e56 --- /dev/null +++ b/full_models/heh/vocab.txt @@ -0,0 +1,27 @@ +| +a +i +u +e +n +l +w +k +m +v +g +o +y +s +t +p +h +d +b +f +c +' +z +j +- + diff --git a/full_models/hif/D_100000.pth b/full_models/hif/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8726018f36c1e6bbf2ed33e4186513a6910909bb --- /dev/null +++ b/full_models/hif/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab33b485e08f16e3b5148dbb9147ce5b369aad9fde4ffaa67780d6ae7d48fe4d +size 561110131 diff --git a/full_models/hif/G_100000.pth b/full_models/hif/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..00629483796679c5b5f46648bc0a9f1797846e37 --- /dev/null +++ b/full_models/hif/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1c04e696185f0cc013c94ac2fce205ea02ef512c9d1e1c58208521c0a3cec9 +size 436619354 diff --git a/full_models/hif/config.json b/full_models/hif/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hif/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hif/vocab.txt b/full_models/hif/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a172408551abfd50201f7bc924a41a217b6134f7 --- /dev/null +++ b/full_models/hif/vocab.txt @@ -0,0 +1,40 @@ +| +a +e +h +i +k +r +u +s +m +n +o +l +b +t +g +p +j +d +y +c +w +ñ +ṭ +ṛ +f +ḍ +z +v +- +' +q +x +0 +4 +1 +6 +– +2 + diff --git a/full_models/hig/D_100000.pth b/full_models/hig/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed89d2beddeb1dc509dd50bdef2ebc9b66956a04 --- /dev/null +++ b/full_models/hig/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c78f3927853aae73d0199b31b11ed2e3d6887c1cb401e0df17aebda7da3e9a7 +size 561110006 diff --git a/full_models/hig/G_100000.pth b/full_models/hig/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49212e7bd8f4cc7779612e440033decdab33ee44 --- /dev/null +++ b/full_models/hig/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d280f923323187f67af368a5ff65a2222ac816d23a9878d3c9f766483bde19 +size 436610638 diff --git a/full_models/hig/config.json b/full_models/hig/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hig/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hig/vocab.txt b/full_models/hig/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ac603bb1f445184cca837a924bbc43a7374889eb --- /dev/null +++ b/full_models/hig/vocab.txt @@ -0,0 +1,36 @@ +| +ə +a +m +i +n +t +w +k +y +l +s +h +r +g +á +b +d +u +z +e +j +v +́ +- +p +f +c +ɗ +ɓ +— +' +ú +o +í + diff --git a/full_models/hil/D_100000.pth b/full_models/hil/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83bdc13a32c9ecc7332ce3e907ccc102aa3c1756 --- /dev/null +++ b/full_models/hil/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:877092cd6858047f4b1c9b26f7130999687602cbb9c34730e96ee7282f7df3f3 +size 561109997 diff --git a/full_models/hil/G_100000.pth b/full_models/hil/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..32d0e0fd1322e71d6fda47229386c6b83ae26387 --- /dev/null +++ b/full_models/hil/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d19aa3b446271dd8d503d85f6c1ba1b3b0c902a4e959df01b0575b4b4c4fb1 +size 436626289 diff --git a/full_models/hil/config.json b/full_models/hil/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hil/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hil/vocab.txt b/full_models/hil/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8b05f41b21c64949d59dbee29db979e81dc255d2 --- /dev/null +++ b/full_models/hil/vocab.txt @@ -0,0 +1,42 @@ +a +| +n +g +i +s +o +k +m +l +t +u +p +d +y +b +h +r +w +e +- +j +c +0 +f +v +z +q +— +1 +2 +4 +5 +3 +x +9 +6 +7 +' +8 +ñ + diff --git a/full_models/hin/D_100000.pth b/full_models/hin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9aaee4ed2d0bbc083aef15e22b35680ea2640f3b --- /dev/null +++ b/full_models/hin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08350156b24a5adc06b82cd74a9c9e1e19b1c6dabca6e2130b1bd4c7a69a038 +size 561110274 diff --git a/full_models/hin/G_100000.pth b/full_models/hin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eea809f43514f08bb78b25e2bb5641e67a7d95ff --- /dev/null +++ b/full_models/hin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce6460a34e47928a9eb298b75af9fefb47b1bb806294b7f79697f4543e6aa98 +size 436697338 diff --git a/full_models/hin/config.json b/full_models/hin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hin/vocab.txt b/full_models/hin/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d13a34fe8465b49a513728567e18b8dc3ee8ebc --- /dev/null +++ b/full_models/hin/vocab.txt @@ -0,0 +1,72 @@ +फ +4 +1 +- +अ +इ +8 + +0 +छ +न +ए +ऐ +़ +ष +ि +ँ +च +2 +ऑ +थ +भ +ी +‍ +ॅ +3 +ञ +ै +ु +ठ +ं +ॉ +उ +_ +ई +ः +ह +ध +ल +र +स +ब +ख +ण +' +` +व +घ +प +ग +ढ +य +े +् +ा +आ +ड +ज +झ +श +औ +ो +द +ृ +ौ +ऊ +ू +ओ +ट +त +क +म diff --git a/full_models/hlb/D_100000.pth b/full_models/hlb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..70b2fa395df6fe3d9afb5e6a2f390d54e1975eed --- /dev/null +++ b/full_models/hlb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0b9d8538db4dbaf30774a1ef545bf0ada48bdce8d0c4338b8ae67edc4ca948 +size 561078852 diff --git a/full_models/hlb/G_100000.pth b/full_models/hlb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e3e952b4afc33e29be3f37772960d3f40ee92a70 --- /dev/null +++ b/full_models/hlb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a149c198ce8f4e35bf41872c7b3778de336f26d17dcc82c21ebbe6afbc7b04c +size 436411362 diff --git a/full_models/hlb/config.json b/full_models/hlb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hlb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hlb/vocab.txt b/full_models/hlb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..30b96237411c440dd4b62eff36c177579097a13b --- /dev/null +++ b/full_models/hlb/vocab.txt @@ -0,0 +1,51 @@ +ड +़ +_ +ल +ु +ज +ि +स +ई +उ +फ +अ +थ +घ +झ +े +' +व +आ +य +न +ए +त +ू +ट +ख +- +क +ो +ध +ढ +ं +र +ब +म +प +ऊ +ग +ठ + +ा +च +इ +छ +ह +द +ओ +‍ +भ +ी +् diff --git a/full_models/hlt/D_100000.pth b/full_models/hlt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d00b3cc5ab85f5f7e525b7b09b90287c74ee6bea --- /dev/null +++ b/full_models/hlt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c70d647c10ee14fb32999cd28d10936c3aebe40944251be2f8b386e5cf72dff +size 561079011 diff --git a/full_models/hlt/G_100000.pth b/full_models/hlt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..26447c56a37d458262df8a547f83cfc1579efc25 --- /dev/null +++ b/full_models/hlt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62831b5d14fb684892743260566bc4646c2c46652c96763bf93d9b0c70c406c +size 436359230 diff --git a/full_models/hlt/config.json b/full_models/hlt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hlt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hlt/vocab.txt b/full_models/hlt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4f6a1207358848fc01a964e66b278c04cb782436 --- /dev/null +++ b/full_models/hlt/vocab.txt @@ -0,0 +1,28 @@ +r +y +u +o +m +v +g +i +h +s +n +e +d +l +w +z + +_ +k +' +- +t +c +f +a +j +b +p diff --git a/full_models/hne/D_100000.pth b/full_models/hne/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..64a201d104102404b78ea1cc0c4e3e507f9af5cc --- /dev/null +++ b/full_models/hne/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2d0650df3296f80f732f3c8e2b43fb900988b7e1db81f9a6bfe8aa7d1010db1 +size 561079095 diff --git a/full_models/hne/G_100000.pth b/full_models/hne/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57f41127c9b1c7b2664915a38310a321240a9daf --- /dev/null +++ b/full_models/hne/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2430351df4e507499f4929cb71b0a96d91ae0565aff46d879da2f8de7c898e2 +size 436436056 diff --git a/full_models/hne/config.json b/full_models/hne/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hne/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hne/vocab.txt b/full_models/hne/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8542c0b9c55a9c8a4785844cc72a4fdd0b793268 --- /dev/null +++ b/full_models/hne/vocab.txt @@ -0,0 +1,61 @@ +| +ा +र +े +क +न +म +ह +स +ि +ल +त +ं +ब +प +य +ी +व +ो +अ +ज +द +ु +ऊ +ओ +ू +ग +ख +ए +् +च +इ +थ +आ +भ +ई +ड +ध +घ +़ +ट +‍ +छ +ठ +झ +उ +- +फ +ढ +ौ +ै +ः +– +' +6 +4 +0 +5 +3 +ृ + diff --git a/full_models/hnn/D_100000.pth b/full_models/hnn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d9a6c1572159667b5f2f4e3c00c2cefa258b79e5 --- /dev/null +++ b/full_models/hnn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ac12337862d2440054f81432ec79edc73fe5043431de83ae1bf77b5dcd1571 +size 561078873 diff --git a/full_models/hnn/G_100000.pth b/full_models/hnn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dab5d2ce6e6de0b3d5be22a0213d74fab67cc7bc --- /dev/null +++ b/full_models/hnn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61994d344c5c771ea55d49361df52624cadf0dc094c4883ef51c61b65eb6934f +size 436341341 diff --git a/full_models/hnn/config.json b/full_models/hnn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hnn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hnn/vocab.txt b/full_models/hnn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fb55d824eee124740da569acaa9494b353bc11d6 --- /dev/null +++ b/full_models/hnn/vocab.txt @@ -0,0 +1,21 @@ +- +p +s +d +h +i + +b +m +u +a +r +g +_ +' +y +w +k +l +n +t diff --git a/full_models/hns/D_100000.pth b/full_models/hns/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9499b26319069553ad3b17fbeb28b21b67a185b6 --- /dev/null +++ b/full_models/hns/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914ced33fe573de0501384304c43e866e75c8a8af8a7739daf23e44f0c2d1739 +size 561109884 diff --git a/full_models/hns/G_100000.pth b/full_models/hns/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6eaba38b7fad44d7704f18c3d6e5c4eaa6c96d79 --- /dev/null +++ b/full_models/hns/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ddac7b82d6aa484701b0c744c2522bdccbd66ecdf950cd3e4cb5388223f785d +size 436595353 diff --git a/full_models/hns/config.json b/full_models/hns/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hns/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hns/vocab.txt b/full_models/hns/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86cdfd81e6c28676646f0e23bfaa09f7a1ec73f3 --- /dev/null +++ b/full_models/hns/vocab.txt @@ -0,0 +1,30 @@ +a +| +e +i +k +h +o +r +t +s +b +l +n +d +m +j +g +p +w +u +- +f +' +y +é +ó +á +z +í + diff --git a/full_models/hoc/D_100000.pth b/full_models/hoc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..60ccbfe12f5bbbbfabcef9590d4150d39c9d8e88 --- /dev/null +++ b/full_models/hoc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac0c8746e2cf5361f875a9c305c7b42b90254ddd40a13ef3e2a78ee484deace +size 561078861 diff --git a/full_models/hoc/G_100000.pth b/full_models/hoc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20425421a794109a3038396e33127b99920544be --- /dev/null +++ b/full_models/hoc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5c8f200852224370f2e70283f00168d6a6d3e87d4df085da48be26d985a551 +size 436418104 diff --git a/full_models/hoc/config.json b/full_models/hoc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hoc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hoc/vocab.txt b/full_models/hoc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4ead993bd21b3785a2aac96bd155e348207cc587 --- /dev/null +++ b/full_models/hoc/vocab.txt @@ -0,0 +1,55 @@ +ଟ +ଢ +ସ +ି +ଫ + +ମ +' +ଥ +- +୍ +ୃ +ୌ +ୈ +ନ +ତ +ୟ +ଞ +େ +– +ଃ +କ +ହ +ଅ +ଶ +ଡ +ଂ +ଖ +ଇ +ଣ +ଙ +ଉ +ଭ +‍ +ଁ +ୀ +— +ୋ +ର +_ +ଦ +ୱ +i +ୁ +ଆ +ଚ +ା +ବ +ପ +ଳ +ଲ +ଏ +ଗ +ଜ +4 diff --git a/full_models/hoy/D_100000.pth b/full_models/hoy/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..71a228a3165d78f5ad3834f05a8c5b10e192d343 --- /dev/null +++ b/full_models/hoy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85d618eb3ad66ac952f949513d89e1bcbfd179541f51e36f7c7cfd42fff43f3 +size 561075952 diff --git a/full_models/hoy/G_100000.pth b/full_models/hoy/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f178f38f2a0cad2badacfd01d8a3411bdbf88ccb --- /dev/null +++ b/full_models/hoy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee87aa77b55f87fb082951068a5e3977fd1cede88a50513e4468d6b893293e1 +size 436412061 diff --git a/full_models/hoy/config.json b/full_models/hoy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hoy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hoy/vocab.txt b/full_models/hoy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8b89cef23634d48ae3b6ca0336b2aa7c1accee7e --- /dev/null +++ b/full_models/hoy/vocab.txt @@ -0,0 +1,61 @@ +| +ा +द +र +न +ु +क +ी +् +त +स +य +ि +ळ +म +आ +ो +े +ं +अ +ग +ल +व +ह +प +ट +ब +ई +श +ऊ +ज +च +इ +उ +‍ +ू +भ +ड +ध +ख +ढ +ॉ +घ +ण +ै +फ +ौ +थ +- +ठ +ष +ओ +छ +औ +झ +ए +़ +ृ +ँ +' + diff --git a/full_models/hto/D_100000.pth b/full_models/hto/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bea12ca51c6c3814a74b91f621d51ea0f873b696 --- /dev/null +++ b/full_models/hto/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ac890f37a9b645a635c6bc1f9cc29e7a12a2afccbd353056229652690ddc286 +size 561109899 diff --git a/full_models/hto/G_100000.pth b/full_models/hto/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7aaa7a29cbff2822412ca95c7edf0b85bae1d022 --- /dev/null +++ b/full_models/hto/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce62d77d7bd60b38fc7549c28f5841d4811383ab605c26f706cc84f6ead4fc8 +size 436617478 diff --git a/full_models/hto/config.json b/full_models/hto/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hto/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hto/vocab.txt b/full_models/hto/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..140990cbbde79ca4e83cf494a64d236656fd14db --- /dev/null +++ b/full_models/hto/vocab.txt @@ -0,0 +1,39 @@ +| +a +ù +e +i +o +n +m +u +d +c +l +r +f +j +í +t +á +z +ó +ñ +b +é +à +g +s +ú +p +h +v +ü +k +q +' +y +` +x +- + diff --git a/full_models/hub/D_100000.pth b/full_models/hub/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6ce122e400c0b641b921ff2a0c0b092e84b03ac0 --- /dev/null +++ b/full_models/hub/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f58f0ba7635d4b57f11e77923d454befbe4f0f87bab1c2d6ad16d75b53d9362 +size 561109897 diff --git a/full_models/hub/G_100000.pth b/full_models/hub/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3a404b3466e3068b84808e5c0b160e27349e6cc5 --- /dev/null +++ b/full_models/hub/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b413e826409c8f39d744a413bf06ae00b17eb88a2f4fb1c9a2ecc080d0ad6c1b +size 436606887 diff --git a/full_models/hub/config.json b/full_models/hub/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hub/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hub/vocab.txt b/full_models/hub/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7b5459a5309e2f59b1bedc0638ce7931876ab083 --- /dev/null +++ b/full_models/hub/vocab.txt @@ -0,0 +1,35 @@ +a +| +i +u +n +t +k +m +s +r +e +h +c +j +w +p +y +g +o +l +ú +d +í +b +á +é +v +f +ó +z +' +q +x +ñ + diff --git a/full_models/hui/D_100000.pth b/full_models/hui/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d545fc4ea72999a10ed6df35c4903058de1d7f38 --- /dev/null +++ b/full_models/hui/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c1cb07b0716d990bcf75ca9e9ed272247f513c7e92f2242cc9d4d22cd8ad97 +size 561108347 diff --git a/full_models/hui/G_100000.pth b/full_models/hui/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7791306887ea0f6c622fd10bb073414f4e04b685 --- /dev/null +++ b/full_models/hui/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a1dcee7f23134f2e29d5b0ee0b4d1ec46ae31fe8811a9ecdeec344e713dc6e +size 436585239 diff --git a/full_models/hui/config.json b/full_models/hui/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hui/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hui/vocab.txt b/full_models/hui/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a5559d9a0429b00bada1c1879e686ded97cc01a6 --- /dev/null +++ b/full_models/hui/vocab.txt @@ -0,0 +1,27 @@ +a +| +i +n +o +e +g +b +l +u +h +m +d +r +w +t +y +k +p +s +í +̱ +̠ +á +- +é + diff --git a/full_models/hun/D_100000.pth b/full_models/hun/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2af969de0a7591039eeeedf30d7b25d4bd5d4d62 --- /dev/null +++ b/full_models/hun/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c687407a1ca0bf9757441ec05fd83c5e1b22545b189308a46c9809fb7a04f1c +size 561110761 diff --git a/full_models/hun/G_100000.pth b/full_models/hun/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3326e699ad7432fdb519632053e95f739271234d --- /dev/null +++ b/full_models/hun/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f040bc9ff1814bed0c33232686f313ce923a093b204e77418a2ca791ecc3cf4e +size 436618514 diff --git a/full_models/hun/config.json b/full_models/hun/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hun/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hun/vocab.txt b/full_models/hun/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..2fb4545b7d92e0110034e011c6a2976f6d4413a3 --- /dev/null +++ b/full_models/hun/vocab.txt @@ -0,0 +1,37 @@ +r +t +l +ó +- +e +k +i +y +í + +b +d +é +h +z +p +n +ö +a +j +ő +u +ü +o +v +c +g +_ +á +ú +x +s +m +ű +f +– diff --git a/full_models/hus-dialect_centralveracruz/D_100000.pth b/full_models/hus-dialect_centralveracruz/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..743cf9c6da74371d033cbb6f583de206ebdf1905 --- /dev/null +++ b/full_models/hus-dialect_centralveracruz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0b106ae5b3798d33efa1353427fbafef75a09faae4aefe8a00cdbbcff7d45c +size 561078470 diff --git a/full_models/hus-dialect_centralveracruz/G_100000.pth b/full_models/hus-dialect_centralveracruz/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..e2d055ff4b40af6c87ca4eb78cd5287c59df6b42 --- /dev/null +++ b/full_models/hus-dialect_centralveracruz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dc7c0e41293b8061a972fcb3bc298ee1fdaa77dcac2a2678d3173108e1d039 +size 436359892 diff --git a/full_models/hus-dialect_centralveracruz/config.json b/full_models/hus-dialect_centralveracruz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/hus-dialect_centralveracruz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hus-dialect_centralveracruz/vocab.txt b/full_models/hus-dialect_centralveracruz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..91c9391e43d07c5e38280f522b6f4e51ba137bdb --- /dev/null +++ b/full_models/hus-dialect_centralveracruz/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +t +n +k +l +j +e +s +b +h +o +u +x +c +w +m +y +d +p +r +— +g +f +á +ó +ß +œ + diff --git a/full_models/hus-dialect_westernpotosino/D_100000.pth b/full_models/hus-dialect_westernpotosino/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..25804adf3abce9d8ebd3058adfd3360ea1ec701b --- /dev/null +++ b/full_models/hus-dialect_westernpotosino/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171f23371a8fe5daf1ca502c239ff63cdee9613a195b3614ea492eda30f2b822 +size 561078879 diff --git a/full_models/hus-dialect_westernpotosino/G_100000.pth b/full_models/hus-dialect_westernpotosino/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..faff53bbdf9e2882e998a191253d18c90d27d6d8 --- /dev/null +++ b/full_models/hus-dialect_westernpotosino/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94c8b1344b42fabefa4dd155daa0f7465e44b3063680bbe137a62fcac5e1eae3 +size 436397232 diff --git a/full_models/hus-dialect_westernpotosino/config.json b/full_models/hus-dialect_westernpotosino/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hus-dialect_westernpotosino/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hus-dialect_westernpotosino/vocab.txt b/full_models/hus-dialect_westernpotosino/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e67edc0c640d80eb20994ba96fd929848a244916 --- /dev/null +++ b/full_models/hus-dialect_westernpotosino/vocab.txt @@ -0,0 +1,45 @@ +4 +é +b +' +á +ñ +_ +j + +k +í +6 +ó +f +d +v +ú +r +t +7 +e +u +a +2 +w +0 +3 +p +h +s +g +9 +n +5 +à +i +x +1 +z +- +o +m +y +c +l diff --git a/full_models/huu/D_100000.pth b/full_models/huu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ffe4c5f819af1bb9853a534185083cb17031f957 --- /dev/null +++ b/full_models/huu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28bacdb906c1c38165196c1609632d1c434cae17e3821d324189b8b1eb4bdc01 +size 561078635 diff --git a/full_models/huu/G_100000.pth b/full_models/huu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7cb1e23ca0e11befafca0ff1258bb55067ca1c5 --- /dev/null +++ b/full_models/huu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d7c8afc1f2fb70092a73872f9f3bb055763655d723b00b1aa7d3e2de6c47cb +size 436378001 diff --git a/full_models/huu/config.json b/full_models/huu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/huu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/huu/vocab.txt b/full_models/huu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3c2ace5c06fa76c389591c6be0cef5f244c638b6 --- /dev/null +++ b/full_models/huu/vocab.txt @@ -0,0 +1,37 @@ +ñ +r +a +_ +z +g +u +n +q +c +ɨ +k +í +p +h +b +x + +j +— +é +i +f +t +d +- +ó +o +e +v +y +ú +' +s +l +m +á diff --git a/full_models/huv/D_100000.pth b/full_models/huv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf05d08c4d15e6a4086b47a3f595f63cb7190309 --- /dev/null +++ b/full_models/huv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eece8354dcc2ee4619eadaebc089907082a4b4088f8f32dff315067755deca1e +size 561109862 diff --git a/full_models/huv/G_100000.pth b/full_models/huv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..80bbce27b6619831d4e278722027d6d55193073e --- /dev/null +++ b/full_models/huv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2334276368296d08998f04f2ae9d94d64f4af00e495d8c49ea300d0eb5bc586c +size 436611395 diff --git a/full_models/huv/config.json b/full_models/huv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/huv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/huv/vocab.txt b/full_models/huv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d809cf1a486d4b8744aa5e5a6d07f1b4661411e --- /dev/null +++ b/full_models/huv/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +i +e +t +ü +m +j +o +w +c +l +s +g +y +p +d +u +r +x +q +b +h +á +í +ú +ó +é +f +ǘ +v +z +ñ +k +1 + diff --git a/full_models/hvn/D_100000.pth b/full_models/hvn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..95d03583758a4a767a8239d53dd137fa13d94667 --- /dev/null +++ b/full_models/hvn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10d60fa61315daffb248e248ba4c6e69eb63234b7378b0fe1a0e7fa2ff6e4a43 +size 561076019 diff --git a/full_models/hvn/G_100000.pth b/full_models/hvn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91350e07aeab237bff73007d4db49bed3be4b34c --- /dev/null +++ b/full_models/hvn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c539eba6d8b2234bf6e649d4ddad8c851c3749f74336902f16f9fa5e6c358c6 +size 436333649 diff --git a/full_models/hvn/config.json b/full_models/hvn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hvn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hvn/vocab.txt b/full_models/hvn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..25ab9864721cf6c387b8056c5f7c9f770d4134b7 --- /dev/null +++ b/full_models/hvn/vocab.txt @@ -0,0 +1,27 @@ +e +a +s +' + +g +d +r +ó +o +j +f +w +p +_ +l +- +u +n +è +i +b +h +m +k +t +y diff --git a/full_models/hwc/D_100000.pth b/full_models/hwc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa699809342ebf31d6bda67658842917793b9d3c --- /dev/null +++ b/full_models/hwc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250600c435c071fe8ff73a1e73fd26d2e3bbc7c7435b62b8e00271450c42438d +size 561078721 diff --git a/full_models/hwc/G_100000.pth b/full_models/hwc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..508be9da46579f753e628c920fb19c4cb358ba7a --- /dev/null +++ b/full_models/hwc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feeb1e2538650a9d662ef2a3e146166d5f068f299b560caebe179c82f89714d1 +size 436378149 diff --git a/full_models/hwc/config.json b/full_models/hwc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hwc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hwc/vocab.txt b/full_models/hwc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b07dba3f802b5d762098009c7b6c53bc3dc7994f --- /dev/null +++ b/full_models/hwc/vocab.txt @@ -0,0 +1,38 @@ +5 +j +r +z +w +s +4 +_ +h +n +t +i +o +b +m +c +x +k +q +e +- +l +f +d +y +a +— +' +0 +p +v +6 + +u +g +1 +7 +2 diff --git a/full_models/hyw/D_100000.pth b/full_models/hyw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2d6867f44dce95131b02aeeace8196b610e37c9 --- /dev/null +++ b/full_models/hyw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22de9258818a95bd7ff66185f139e7afef2b92f851cdf5ea8b1172a7bfd58233 +size 561078731 diff --git a/full_models/hyw/G_100000.pth b/full_models/hyw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fc0ba3f988e90a5a41fba35b71b82801851fa3eb --- /dev/null +++ b/full_models/hyw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5336503869af94f480d42108f0c43039c8bb2a97f6c64c6aad26ab0d27aeb1 +size 436387946 diff --git a/full_models/hyw/config.json b/full_models/hyw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/hyw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/hyw/vocab.txt b/full_models/hyw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d77241923fcc8908fa005706f83600af1ab46842 --- /dev/null +++ b/full_models/hyw/vocab.txt @@ -0,0 +1,41 @@ +է +ր +ծ +հ +զ +ֆ +_ +ղ +կ +գ +դ +ւ +ի +պ +օ +ս +ք +չ +ն +ա +ճ +լ +ռ +վ +թ +ձ +տ +խ +բ +շ +ո +փ +' +մ +ց + +ը +ե +յ +ժ +ջ diff --git a/full_models/iba/D_100000.pth b/full_models/iba/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2641f1adccfa0cf8e4f0b49e2f63d113bfb9df9a --- /dev/null +++ b/full_models/iba/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d15bb0ec09341c62775137c453ee4540b4865f98f9b16b3caf1d93bfd36bbde +size 561110102 diff --git a/full_models/iba/G_100000.pth b/full_models/iba/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c67b11524860c94d704bdc70de5e96a4f060a2f0 --- /dev/null +++ b/full_models/iba/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a337fc597bfda1a3a4af217f705d3da60e674714bdd0c3f55154e90e90af14c +size 436595314 diff --git a/full_models/iba/config.json b/full_models/iba/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/iba/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/iba/vocab.txt b/full_models/iba/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e376906bf3c1f6699e2a1fe81381461f5a0f7e91 --- /dev/null +++ b/full_models/iba/vocab.txt @@ -0,0 +1,29 @@ +a +| +i +n +u +e +k +g +t +l +d +s +m +r +b +h +y +p +j +o +w +c +- +v +0 +3 +5 +2 + diff --git a/full_models/icr/D_100000.pth b/full_models/icr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c49de3b219f9157b12e79443404e80e5bbbf50db --- /dev/null +++ b/full_models/icr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1b5021da120fc5e58e43f6e98946ba64e384e46c858449dccde023b20ad1f8 +size 561079019 diff --git a/full_models/icr/G_100000.pth b/full_models/icr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4aa8737cb1278e961748845996946d4c84f3f29 --- /dev/null +++ b/full_models/icr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2731f9df452c9ccc33090e6e3c77017ef4f3694e3f4af0140d6e614a448153f8 +size 436375843 diff --git a/full_models/icr/config.json b/full_models/icr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/icr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/icr/vocab.txt b/full_models/icr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c8df2f81bac20d51aa0917d75493b6852a4ef837 --- /dev/null +++ b/full_models/icr/vocab.txt @@ -0,0 +1,35 @@ +n +x +p +s +q +k +w +l +f +e +2 +0 +1 +m +z +c +- +o +u + +i +' +a +h +t +b +v +9 +r +j +— +_ +d +g +y diff --git a/full_models/idd/D_100000.pth b/full_models/idd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2145ed111822fc351c4817f5d4b763d2c07842fe --- /dev/null +++ b/full_models/idd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd243343e144bb08ea1c95343d5daa8a395f58685d8571a96b0e8771fbad0a15 +size 561078846 diff --git a/full_models/idd/G_100000.pth b/full_models/idd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..12636e04cdbcd844f9eacfd2575d565f601f1f27 --- /dev/null +++ b/full_models/idd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a675ce4132d73b7931593a73be23a4dc3eb4ebe788693f88e19eb3935ce33b +size 436385477 diff --git a/full_models/idd/config.json b/full_models/idd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/idd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/idd/vocab.txt b/full_models/idd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d22e0dbf95fae66c6f1bfd248e92a3f843de57ef --- /dev/null +++ b/full_models/idd/vocab.txt @@ -0,0 +1,40 @@ +p +ì +é +ḿ +d + +è +n +í +r +o +ɔ +ǹ +l +ò +ɛ +u +ú +ù +ó +́ +j +m +k +s +w +i +g +_ +a +h +' +y +à +f +b +e +t +̀ +á diff --git a/full_models/ifa/D_100000.pth b/full_models/ifa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ba0989b75156349f359315cfb3820f98bb8316a --- /dev/null +++ b/full_models/ifa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a25ea99f9c314bd669ca4a53211fb30462622bd13b7739e698e61d4e5af20a6 +size 561079096 diff --git a/full_models/ifa/G_100000.pth b/full_models/ifa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce69d441f40f33ff74885f93130018d87ba25e3a --- /dev/null +++ b/full_models/ifa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01e1cbff9e1c9d20ecb2a094a869646f6e8bece0afbeca429a4d256ff741de85 +size 436360688 diff --git a/full_models/ifa/config.json b/full_models/ifa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ifa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ifa/vocab.txt b/full_models/ifa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..53f481d284d5c1741fb82af0c1e90b0fa6dda8a5 --- /dev/null +++ b/full_models/ifa/vocab.txt @@ -0,0 +1,29 @@ +h +n +t +- +g +v +e +x +w +s +l +c +i +' +f +z +j +m +o +a +y + +p +b +k +u +d +r +_ diff --git a/full_models/ifb/D_100000.pth b/full_models/ifb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf7c601cfadd6bd29257b6ffdded262c4dc73bf2 --- /dev/null +++ b/full_models/ifb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed997cec4718b21c19c4c83e4bda0e5fb1e11b5eb9918e645e05869064409b0a +size 561110015 diff --git a/full_models/ifb/G_100000.pth b/full_models/ifb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57055251fbce52a4c5a507eb65d506147676bea9 --- /dev/null +++ b/full_models/ifb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b03262b5b2c8943b659b99378d1e9bbb50ab252b14841fcecd52552d9014210 +size 436595339 diff --git a/full_models/ifb/config.json b/full_models/ifb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ifb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ifb/vocab.txt b/full_models/ifb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..eb9ebc62095f361e4984f891a7c9c8f76a5abbf2 --- /dev/null +++ b/full_models/ifb/vocab.txt @@ -0,0 +1,30 @@ +| +a +n +i +u +d +y +h +t +m +o +g +l +p +' +b +e +s +w +k +r +j +c +v +z +f +x +- +q + diff --git a/full_models/ife/D_100000.pth b/full_models/ife/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb90e946fee1f2aa8a5878ff0b412078f092a022 --- /dev/null +++ b/full_models/ife/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67dcc0b9e07776aeac8334f03b9a6eff3d22b263b0ffbfae936b0e01f7082a87 +size 561079106 diff --git a/full_models/ife/G_100000.pth b/full_models/ife/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..17a59ad248fae08af19d2a47fe6f5a5cc723b697 --- /dev/null +++ b/full_models/ife/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7af1d1f3fa1d46ead0a0ebf416071785ee8548c61732537381e406a4d653e54 +size 436405173 diff --git a/full_models/ife/config.json b/full_models/ife/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ife/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ife/vocab.txt b/full_models/ife/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..84820c532e1bdc7f63fa3d645231bb66dd4a400c --- /dev/null +++ b/full_models/ife/vocab.txt @@ -0,0 +1,49 @@ +y +o +s +z +ǹ +d +t +e +̃ +ɖ +ĩ +ì +á +h +é +a +́ +m +w +ó +_ +ŋ +f +ń +à +ã +ɔ +g +l +ũ +̀ +b +ò +k +í +u +ú +r +ɛ +ḿ +ṹ + +è +p +‐ +n +- +ù +i diff --git a/full_models/ifk/D_100000.pth b/full_models/ifk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e0d33b02cfca5354612bfd2ecb5b13dbc1f2b76 --- /dev/null +++ b/full_models/ifk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6746dc019c2762c3ed6fa47042d9eda0741ccd668b36cd99840a81d3d3b1273f +size 561109471 diff --git a/full_models/ifk/G_100000.pth b/full_models/ifk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d3e4a6508d8904bf7b6360db64f0e9c1e54e9291 --- /dev/null +++ b/full_models/ifk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45204dcd0b0ded3ea3d07a772f5fb2552278d4c1591c22470b78e49351c9da7 +size 436604303 diff --git a/full_models/ifk/config.json b/full_models/ifk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ifk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ifk/vocab.txt b/full_models/ifk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9d1122f3f96ffaf07533df45d35a4ef746b6762e --- /dev/null +++ b/full_models/ifk/vocab.txt @@ -0,0 +1,34 @@ +| +a +n +i +u +d +t +y +h +o +m +k +g +l +e +p +b +s +- +w +r +j +c +` +' +f +v +z +x +q +1 +9 +7 + diff --git a/full_models/ifu/D_100000.pth b/full_models/ifu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..60a1108b7452734a9118432c84fb8cfd899e750d --- /dev/null +++ b/full_models/ifu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893d021d659535b9b943bbd13b586ea51d1baf5f8a8af9d88e489e6436c0e624 +size 561109882 diff --git a/full_models/ifu/G_100000.pth b/full_models/ifu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f053c417e8e5e1fe72997eaaebeb02e7229edf1 --- /dev/null +++ b/full_models/ifu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec364fe8c96662d39e0c9c4fb3b04231868ac2df93c354d89bbf0e5639accc4 +size 436595354 diff --git a/full_models/ifu/config.json b/full_models/ifu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ifu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ifu/vocab.txt b/full_models/ifu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0b8701c33ca0fb5e4bbc724ec2516507bd83a5b2 --- /dev/null +++ b/full_models/ifu/vocab.txt @@ -0,0 +1,30 @@ +| +a +n +h +i +u +o +t +m +p +c +j +g +y +l +k +e +- +s +d +r +f +' +w +b +v +z +x +á + diff --git a/full_models/ify/D_100000.pth b/full_models/ify/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4193e828374940aa338845f2d260a613509babf7 --- /dev/null +++ b/full_models/ify/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4b92966f5c1c21148fc5501a7e12002c23f81a29c73e36dab2495354d475e3 +size 561109582 diff --git a/full_models/ify/G_100000.pth b/full_models/ify/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5bd78301af5aab8393b2ecfb12109c1ab8954965 --- /dev/null +++ b/full_models/ify/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655bfd87625657c8fb5f1dfebf51216ec8601ec8a6ac72d570372350714c357a +size 436595334 diff --git a/full_models/ify/config.json b/full_models/ify/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ify/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ify/vocab.txt b/full_models/ify/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..040678057ebe77ea271bfd180c34c6b009ede1f8 --- /dev/null +++ b/full_models/ify/vocab.txt @@ -0,0 +1,30 @@ +| +a +n +e +i +u +d +t +g +m +h +y +l +k +p +- +s +b +w +o +j +r +c +' +v +f +z +x +q + diff --git a/full_models/ign/D_100000.pth b/full_models/ign/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c6b43bbed5a8aa1a22470b413472005f559a3f2b --- /dev/null +++ b/full_models/ign/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96585f4116311a12ff55b68d81e385db50d5ee2cf4a342507df9e3714372062 +size 561109857 diff --git a/full_models/ign/G_100000.pth b/full_models/ign/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cffa593e26570decc7f429da6bdfb51094d7ff1c --- /dev/null +++ b/full_models/ign/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41008b75baaadf028e51e5252cfc9a29ab37df892eaad783c42e8c206624150d +size 436625210 diff --git a/full_models/ign/config.json b/full_models/ign/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ign/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ign/vocab.txt b/full_models/ign/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cb1014c85910a108e6775378e9470cb4d8d2afba --- /dev/null +++ b/full_models/ign/vocab.txt @@ -0,0 +1,43 @@ +a +| +i +e +t +n +r +' +u +k +m +p +s +c +w +h +á +y +j +v +é +í +o +ú +l +ñ +d +b +– +g +f +ó +z +q +- +x +0 +1 +4 +9 +2 +3 + diff --git a/full_models/ikk/D_100000.pth b/full_models/ikk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f70d76502ee47992c59026fa327c0e1531ac7704 --- /dev/null +++ b/full_models/ikk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97048ff4542b5935b2c6c84bf417a8dfa8bfc4edbd08471f39fb61e643ddd5cb +size 561079251 diff --git a/full_models/ikk/G_100000.pth b/full_models/ikk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a908fca9efd1554e864339e534134a89b54ecef8 --- /dev/null +++ b/full_models/ikk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:227d1bcd1f2c87107c3d34ada6cae2fc70d9d8a22962f082ae10d988cb7303af +size 436379910 diff --git a/full_models/ikk/config.json b/full_models/ikk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ikk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ikk/vocab.txt b/full_models/ikk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4998fe9142e1483a74bcf67953a52480d69d3516 --- /dev/null +++ b/full_models/ikk/vocab.txt @@ -0,0 +1,36 @@ +r +t +' +a +h +k +n +ụ +- +b +ị + +i +w +ù +̀ +m +o +e +c +s +y +_ +z +l +ò +v +g +d +ẹ +u +f +p +ṅ +j +ọ diff --git a/full_models/ilb/D_100000.pth b/full_models/ilb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..da759d34c8c4b6f2023c0b85a1c4014c5e886a75 --- /dev/null +++ b/full_models/ilb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc47d711f0530de2e67eb09a0540634b6509662b97d54cdcf35cbc7d2c58480 +size 561079477 diff --git a/full_models/ilb/G_100000.pth b/full_models/ilb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cac6ccc901c65dbc315ce9be86ac726988890a2d --- /dev/null +++ b/full_models/ilb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00fc151ef22325a7e7072622487fbb18b3a268fc75b380c2a7cc3d7c912d9dec +size 436361490 diff --git a/full_models/ilb/config.json b/full_models/ilb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ilb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ilb/vocab.txt b/full_models/ilb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8d212c3ed539cf3aa0ffbc4d11e8341c0c748f8e --- /dev/null +++ b/full_models/ilb/vocab.txt @@ -0,0 +1,28 @@ +m +ŋ +l +e +z + +n +c +u +' +w +s +d +f +i +y +p +h +- +j +a +t +b +_ +o +k +v +g diff --git a/full_models/ilo/D_100000.pth b/full_models/ilo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..94635379d2228a671fccd505feac047ac4a96fd4 --- /dev/null +++ b/full_models/ilo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1728770961475ee233d173f74032a32e0c8624f1d9e5e5ef62f593ff72d089 +size 561109966 diff --git a/full_models/ilo/G_100000.pth b/full_models/ilo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1f540e2eb1052825d88176416a2a741b1620cb8 --- /dev/null +++ b/full_models/ilo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8310374fbd590887a31cc23cc022e47d64e2d87a1cce152d41ddd0a3428d79dc +size 436623903 diff --git a/full_models/ilo/config.json b/full_models/ilo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ilo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ilo/vocab.txt b/full_models/ilo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0bad933fc219169e649ceb09c2be977209273b4e --- /dev/null +++ b/full_models/ilo/vocab.txt @@ -0,0 +1,41 @@ +a +| +i +n +t +g +k +d +o +s +m +e +u +p +y +l +r +b +w +j +- +c +h +f +— +v +z +0 +' +2 +1 +4 +x +3 +5 +6 +8 +7 +9 +q + diff --git a/full_models/imo/D_100000.pth b/full_models/imo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7781f5ae219aadb9b72daaebf76444ea56ebaff0 --- /dev/null +++ b/full_models/imo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7683abfd6c458358e0521f2b558ea7af81b92888d6c0682c92ed179302d3c88c +size 561075763 diff --git a/full_models/imo/G_100000.pth b/full_models/imo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b7b25f3ee306c106d9ff0d01b44a6dd299edbb99 --- /dev/null +++ b/full_models/imo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0526468ab9508272a176e95c8d15215ac6b06e54587f0b172f6ba5bb043b225 +size 436338593 diff --git a/full_models/imo/config.json b/full_models/imo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/imo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/imo/vocab.txt b/full_models/imo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fd75762861b2f580d7f528c4543aeae22ceef04b --- /dev/null +++ b/full_models/imo/vocab.txt @@ -0,0 +1,30 @@ +| +i +n +o +a +e +u +m +l +k +p +g +t +b +y +r +d +w +s +j +0 +f +v +h +1 +2 +5 +4 +' + diff --git a/full_models/inb/D_100000.pth b/full_models/inb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d978615785bae9b01681ce7d14d8b95becff6d2c --- /dev/null +++ b/full_models/inb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d01db5be084737a79b483147425bc2089280a04f9e316e49dd7ee624a8305b +size 561109892 diff --git a/full_models/inb/G_100000.pth b/full_models/inb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1b15b8e070dc74c2977e656567c201546fab6e88 --- /dev/null +++ b/full_models/inb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fed52ba435d2db5305b2c7450d35119aae3df30b774b4cafc3de4f5f0745f28c +size 436609175 diff --git a/full_models/inb/config.json b/full_models/inb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/inb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/inb/vocab.txt b/full_models/inb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77d1e4d5b563e02a52f0d2e9f6cc222edf94c4bd --- /dev/null +++ b/full_models/inb/vocab.txt @@ -0,0 +1,36 @@ +a +| +i +­ +u +k +n +s +p +m +r +t +l +c +h +g +w +d +ñ +j +e +b +o +— +ú +á +í +é +f +z +v +ó +̈ +' +x + diff --git a/full_models/ind/D_100000.pth b/full_models/ind/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb8b1a847bf5ea2859734d68fa2312f802b3e58c --- /dev/null +++ b/full_models/ind/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6de512c315a6aaf2f32bfb18c1b87bf4dbc0010b2c44bd3a3d6025c9ecf05d7 +size 561109754 diff --git a/full_models/ind/G_100000.pth b/full_models/ind/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cede66f5d1403d15a61f60b4d6b13c28b23f06ac --- /dev/null +++ b/full_models/ind/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32011b0d18bdb5a6b1fdaa461265a7e11d312860858c1477fa0d1756444231be +size 436606526 diff --git a/full_models/ind/config.json b/full_models/ind/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ind/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ind/vocab.txt b/full_models/ind/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..edf2720f81d6f6ca72ba49611f19a5e2f1cc34ee --- /dev/null +++ b/full_models/ind/vocab.txt @@ -0,0 +1,35 @@ +g +c +o + +— +' +t +n +i +_ +r +d +a +p +- +j +v +l +f +y +w +u +6 +s +h +k +z +0 +1 +5 +4 +e +b +2 +m diff --git a/full_models/iou/D_100000.pth b/full_models/iou/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f73f8578128c80bd0e7af53872bb875b0a6a1e2d --- /dev/null +++ b/full_models/iou/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:097806c094748fee886eba5dc5f5e32d4deeca2000ba664c9fbc31988b3e731b +size 561078707 diff --git a/full_models/iou/G_100000.pth b/full_models/iou/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bf8ba3e6f33c5f78ee9efa19d0c45eb80c51ddf --- /dev/null +++ b/full_models/iou/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ac155983927e8d962588dbd123eec1fc5c6e1edcc63f196fe2d14346c1323c +size 436378041 diff --git a/full_models/iou/config.json b/full_models/iou/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/iou/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/iou/vocab.txt b/full_models/iou/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3269414e0c3c3b9a95c149259bebd24bb2430a35 --- /dev/null +++ b/full_models/iou/vocab.txt @@ -0,0 +1,38 @@ +9 +1 +p +4 +e +i +n +5 +l +s +8 +f +ŋ +j +b +h +r + +a +g +3 +ä +0 +t +o +v +- +k +y +' +m +d +w +6 +u +2 +_ +7 diff --git a/full_models/ipi/D_100000.pth b/full_models/ipi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..69272787bb8e990464e31c3975b5d71302e357d6 --- /dev/null +++ b/full_models/ipi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60525181c117791dc1109de1f26cca29fd39d8255d2050419e8f79e55462ab5d +size 561106304 diff --git a/full_models/ipi/G_100000.pth b/full_models/ipi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..604e4bfa3883e7dfccf3ff32e321bc1d1c163fdc --- /dev/null +++ b/full_models/ipi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d985e6a3624f2749bcfb676dff8e69aa51aa85a183e9f81457e817dd6870692 +size 436555299 diff --git a/full_models/ipi/config.json b/full_models/ipi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ipi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ipi/vocab.txt b/full_models/ipi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..49cef3ee6b9e6e86437fb13eb8825b50074c998e --- /dev/null +++ b/full_models/ipi/vocab.txt @@ -0,0 +1,24 @@ +a +| +e +n +o +i +t +l +p +k +m +u +y +d +w +b +- +s +g +j +ŋ +0 +2 + diff --git a/full_models/iqw/D_100000.pth b/full_models/iqw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2885f5ee884d55ea7c34befedb4acc0a62d81fe9 --- /dev/null +++ b/full_models/iqw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36211d0f6fcc24af45de03f54d3ab783c93f014c5dbc952bcdd206fa90c93d3 +size 561078983 diff --git a/full_models/iqw/G_100000.pth b/full_models/iqw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dbfe1f50a383d64984e470d1a2a01755092b4b06 --- /dev/null +++ b/full_models/iqw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0fde04ec96e3e7acd7d0fd29531fc31583c297fa68c17b338b5bbfa99f99f6 +size 436398509 diff --git a/full_models/iqw/config.json b/full_models/iqw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/iqw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/iqw/vocab.txt b/full_models/iqw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cdd2ee0d9924573a68ce22245c155f9805f28d84 --- /dev/null +++ b/full_models/iqw/vocab.txt @@ -0,0 +1,46 @@ +ù +ị +u +j +p +ó +t +' +ú +ǹ +c +g +d +h +ẹ +o +̀ +s +ọ +y +á +ì +b + +ụ +- +r +l +é +n +a +z +w +í +v +m +6 +è +ò +f +i +́ +e +k +à +_ diff --git a/full_models/iri/D_100000.pth b/full_models/iri/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff3d810bcbf6290f50d33f139bf7cff3bc8b1ae8 --- /dev/null +++ b/full_models/iri/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f23a9f6f85620dbac35708f135659c101cb3dd3c11694e3fa3b9569049f984 +size 561078991 diff --git a/full_models/iri/G_100000.pth b/full_models/iri/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d9ea887486e3ff23c9b6777cd5de0c979b958e10 --- /dev/null +++ b/full_models/iri/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1158b9e102a99653e3044c831137339d20d189378c044edb416dc90c3a7a5f8a +size 436395278 diff --git a/full_models/iri/config.json b/full_models/iri/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/iri/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/iri/vocab.txt b/full_models/iri/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..022c9a309fdd85ab7cf0d2ad7a577ba5731841a3 --- /dev/null +++ b/full_models/iri/vocab.txt @@ -0,0 +1,43 @@ +̱ +s +z +p +y +- +ē +l +u +í +ê +n +t +d +f +ú +ā +a +ī +w +o +m + +g +î +_ +v +ó +â +è +á +3 +i +b +h +j +6 +e +é +' +k +c +r diff --git a/full_models/irk/D_100000.pth b/full_models/irk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c9fa564e8aee95504ff7ddadbf953a6047e02cb2 --- /dev/null +++ b/full_models/irk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc7c5f98b820cc4812fec71be79777c741cd23b9fae688ebaa825c1bfe03e44 +size 561106382 diff --git a/full_models/irk/G_100000.pth b/full_models/irk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5676b4de30bd659074d07d33370f13035e2275e4 --- /dev/null +++ b/full_models/irk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fce9b4df60c4e15a307743054584c0909b22968df398dcb17e4c002489152305 +size 436576190 diff --git a/full_models/irk/config.json b/full_models/irk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/irk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/irk/vocab.txt b/full_models/irk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4e2674fd24bc2f95753a4e3df0e0ab761539842c --- /dev/null +++ b/full_models/irk/vocab.txt @@ -0,0 +1,33 @@ +| +a +i +e +r +n +u +o +s +á +m +h +l +t +g +k +w +' +d +í +y +ó +ú +b +é +q +x +f +p +c +j +z + diff --git a/full_models/isl/D_100000.pth b/full_models/isl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8163033d45316176eaf8b58fdcfcca792f7ba056 --- /dev/null +++ b/full_models/isl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6852f97335c0860bb45a323067813c508e91f0b28855a562afcdf3c23ad09c50 +size 561110513 diff --git a/full_models/isl/G_100000.pth b/full_models/isl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b9516c230f4fd269fe82a3164f6c0a9675b640f --- /dev/null +++ b/full_models/isl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee04403fab907fc74b1fa540f3d16d5bd424931f941a71b0c95882a44490ff0c +size 436631959 diff --git a/full_models/isl/config.json b/full_models/isl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/isl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/isl/vocab.txt b/full_models/isl/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..310686c121c51f6bd2bce975d4f31e3b81f544cf --- /dev/null +++ b/full_models/isl/vocab.txt @@ -0,0 +1,43 @@ +5 +– + +f +ð +l +k +ó +o +a +_ +e +ú +á +3 +g +m +2 +u +p +é +æ +x +v +0 +- +7 +r +s +i +n +d +ý +1 +í +y +8 +b +h +t +þ +j +ö diff --git a/full_models/itl/D_100000.pth b/full_models/itl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..22d2d06555cc55bebeac9cd5fd75a21f5c66536c --- /dev/null +++ b/full_models/itl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ea13b5d5221d00f35e8f674a89406f1ed4ab09ab599292dac6afc5bd7f5ff2 +size 561076072 diff --git a/full_models/itl/G_100000.pth b/full_models/itl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3235feaa3236bc540a1e8c66c23ef7068f9d89c9 --- /dev/null +++ b/full_models/itl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd16216f9b87284df9539367d06162dd09c70f518e1137fcf984c971136535e +size 436382639 diff --git a/full_models/itl/config.json b/full_models/itl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/itl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/itl/vocab.txt b/full_models/itl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ed7ba7b53b05374dd4ea3db125665216d79798a6 --- /dev/null +++ b/full_models/itl/vocab.txt @@ -0,0 +1,48 @@ +э +ч +_ +ӑ +х +ы +и +ӈ +ӄ +ŏ +ɂ +– +р +м +љ +ў +с +ԓ +б +я +й +у + +ь +о +л +н +а +щ +ж +ӽ +2 +в +0 +к +ш +п +т +ʼ +ф +3 +г +з +1 +д +ә +њ +ц diff --git a/full_models/itv/D_100000.pth b/full_models/itv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..db8dec3b718595645a2ae677f6211ce72a1dc213 --- /dev/null +++ b/full_models/itv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba153446064f4cbc15f9e6b1fd1e93d6d88912f9faf1ec7086c8e2113b5a087a +size 561109230 diff --git a/full_models/itv/G_100000.pth b/full_models/itv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b8200b90ef24b3b1fbb4d467ddea830a9bb044d --- /dev/null +++ b/full_models/itv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b4fee844b39a22650a1a1fe1bd8fe35b75e831618256d1fbb7c6ece93d61a5 +size 436595354 diff --git a/full_models/itv/config.json b/full_models/itv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/itv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/itv/vocab.txt b/full_models/itv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ec3f9a8c646ca3abdacd7d3a60fcd1e2516a08a9 --- /dev/null +++ b/full_models/itv/vocab.txt @@ -0,0 +1,30 @@ +a +| +n +i +g +k +u +y +t +m +e +r +l +s +p +d +o +b +w +f +h +z +j +v +- +c +' +x +q + diff --git a/full_models/ixl-dialect_sangasparchajul/D_100000.pth b/full_models/ixl-dialect_sangasparchajul/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0a1cc8a0fa359c986c3f57ef02e1d494382fb5a --- /dev/null +++ b/full_models/ixl-dialect_sangasparchajul/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bab1f90551a0b1f4b09ccdd7c06c5e8696a90db09a9bb529878242f5654e124 +size 561076193 diff --git a/full_models/ixl-dialect_sangasparchajul/G_100000.pth b/full_models/ixl-dialect_sangasparchajul/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be2dbc228aa36cb6a29a1122719f0c44626966f7 --- /dev/null +++ b/full_models/ixl-dialect_sangasparchajul/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a392a57961adf99ba1cd1bcc5b2efd502dde6c68933336251585ae50c2f9325 +size 436348835 diff --git a/full_models/ixl-dialect_sangasparchajul/config.json b/full_models/ixl-dialect_sangasparchajul/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ixl-dialect_sangasparchajul/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ixl-dialect_sangasparchajul/vocab.txt b/full_models/ixl-dialect_sangasparchajul/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3eb816d4d39f477be3bd39ff43501bfeae5fbb4e --- /dev/null +++ b/full_models/ixl-dialect_sangasparchajul/vocab.txt @@ -0,0 +1,33 @@ +v +u +d +x +s +b +i +r +6 +h +e +q +p +g +f +k +3 +4 +0 +l +- +a +z +c +ʼ +y +j + +m +t +_ +o +n diff --git a/full_models/ixl-dialect_sanjuancotzal/D_100000.pth b/full_models/ixl-dialect_sanjuancotzal/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1148963433e4f73f5536dd753f66e70ef27ca726 --- /dev/null +++ b/full_models/ixl-dialect_sanjuancotzal/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f896ee314b68ea77cae3970152710fdd05b6848c6cf36fbf413449cc15431c4c +size 561077465 diff --git a/full_models/ixl-dialect_sanjuancotzal/G_100000.pth b/full_models/ixl-dialect_sanjuancotzal/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ab29e1ebc67a897856612c01ed7cfaadd0ea957a --- /dev/null +++ b/full_models/ixl-dialect_sanjuancotzal/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ee581bff9d69e253aadc44ae5a989aebcbfeb2d9978e8be2be003cf8a58a8f +size 436377211 diff --git a/full_models/ixl-dialect_sanjuancotzal/config.json b/full_models/ixl-dialect_sanjuancotzal/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ixl-dialect_sanjuancotzal/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ixl-dialect_sanjuancotzal/vocab.txt b/full_models/ixl-dialect_sanjuancotzal/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cc15bdb20053d6fcc6cb54d8b68e6b521d21c544 --- /dev/null +++ b/full_models/ixl-dialect_sanjuancotzal/vocab.txt @@ -0,0 +1,42 @@ +| +a +' +t +i +u +e +l +n +o +h +k +s +x +z +c +j +m +q +b +v +y +p +r +— +d +g +0 +f +1 +4 +– +2 +3 +5 +6 +9 +7 +8 +ñ +- + diff --git a/full_models/ixl-dialect_santamarianebaj/D_100000.pth b/full_models/ixl-dialect_santamarianebaj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cd9be32f57ca16e8253619f85e943ad3195becf6 --- /dev/null +++ b/full_models/ixl-dialect_santamarianebaj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116346f004e5dfcc856fbcb649ca967840e077e8a2370bc198306d92a0adeb87 +size 561076166 diff --git a/full_models/ixl-dialect_santamarianebaj/G_100000.pth b/full_models/ixl-dialect_santamarianebaj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1f8c0f651d2b183e68c82733eb6e7e97337275c0 --- /dev/null +++ b/full_models/ixl-dialect_santamarianebaj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea479a98ab3ddc84d2efb4a32fb8a00b332c7ba86a8390318635358e645dcf1 +size 436369319 diff --git a/full_models/ixl-dialect_santamarianebaj/config.json b/full_models/ixl-dialect_santamarianebaj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ixl-dialect_santamarianebaj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ixl-dialect_santamarianebaj/vocab.txt b/full_models/ixl-dialect_santamarianebaj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2be6eb230d333077439a24ad6ff68df929b2af04 --- /dev/null +++ b/full_models/ixl-dialect_santamarianebaj/vocab.txt @@ -0,0 +1,42 @@ +| +a +' +t +e +u +i +l +n +k +s +v +h +o +x +j +b +c +q +m +z +y +p +r +— +ú +d +g +í +é +á +ó +f +– +0 +1 +- +4 +ñ +5 +3 + diff --git a/full_models/izr/D_100000.pth b/full_models/izr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c767d7704717a42fef90beef071460ec9c307510 --- /dev/null +++ b/full_models/izr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f990dd4349b4dacb31d472287d3e85eeecb940e722d25cc4f011129c956654b0 +size 561110117 diff --git a/full_models/izr/G_100000.pth b/full_models/izr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1315f07878f1941801c566a227dbc5be22e57565 --- /dev/null +++ b/full_models/izr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09cbe31c0b76b2d30ba5c4e7359412c6fa77e1033f73129f6809fda77a2b40b0 +size 436613397 diff --git a/full_models/izr/config.json b/full_models/izr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/izr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/izr/vocab.txt b/full_models/izr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b1c87aa4b7bc3f26750c8dd2b3e788727d929bc1 --- /dev/null +++ b/full_models/izr/vocab.txt @@ -0,0 +1,36 @@ +| +a +n +i +k +e +y +r +t +u +s +o +m +g +b +w +f +d +h +z +' +p +l +c +v +0 +j +1 +4 +ŕ +2 +— +ٔ +- +ł + diff --git a/full_models/izz/D_100000.pth b/full_models/izz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1481907b1c87b822a5c57e901d163e8cf7be423b --- /dev/null +++ b/full_models/izz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930cfba33c44de1e37f5e8996b06e0d86e4fee6fe1814e68f2fa3b4d1db8f2ac +size 561079251 diff --git a/full_models/izz/G_100000.pth b/full_models/izz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e9167baae2bbfce308f7cb19e816e15cbd48aa28 --- /dev/null +++ b/full_models/izz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:561c20c1d0d2b087373b1ce90748be7ad8d94422942ece34424fbdfde3d887b5 +size 436404924 diff --git a/full_models/izz/config.json b/full_models/izz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/izz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/izz/vocab.txt b/full_models/izz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a54f729db1b8d9204bc13a0fe7d8f4811daa01b6 --- /dev/null +++ b/full_models/izz/vocab.txt @@ -0,0 +1,48 @@ +ú +è +f +y +s +ẹ +k +ḿ +ị +d +e +́ +j +_ +é +v +ó +p +z + +ń +ụ +í +ọ +t +l +̀ +u +i +á +w +c +r +ò +h +ù +o +ǹ +à +ì +n +' +- +b +m +a +6 +g diff --git a/full_models/jac/D_100000.pth b/full_models/jac/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8ef06c7ed2ff27a8c3ce42936415c30f57cb7c1e --- /dev/null +++ b/full_models/jac/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf133639c2ff8a1c03c81b0a6994699324efc4dc6b016ef4592bf3d40d155a20 +size 561109338 diff --git a/full_models/jac/G_100000.pth b/full_models/jac/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e267088cc2780e0cc487332556fe2e8d060467d2 --- /dev/null +++ b/full_models/jac/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013ce41fe9c09703916f8b621a23863259b90ea050a46763a740dfea5e3c138c +size 436602023 diff --git a/full_models/jac/config.json b/full_models/jac/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jac/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jac/vocab.txt b/full_models/jac/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..568a97166602950b943e6179fc6140dfb83c5610 --- /dev/null +++ b/full_models/jac/vocab.txt @@ -0,0 +1,33 @@ +| +a +i +n +c +t +e +o +h +y +' +l +u +m +j +s +b +x +̈ +w +k +z +p +r +d +ẍ +- +q +g +f +v +` + diff --git a/full_models/jam/D_100000.pth b/full_models/jam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b26fa1ed6a7b2bc09f9e16db9f33836624b21de7 --- /dev/null +++ b/full_models/jam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec659c5180da3cfd55dddf0fd07897b5f561c540c855d7a37c649be134419a6b +size 561109870 diff --git a/full_models/jam/G_100000.pth b/full_models/jam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eda3c895e1a7cec90cf8d7555c371572c9aa8e88 --- /dev/null +++ b/full_models/jam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db701a316c7eaaa27a2d4e8470e9f6c6f070622343d27778f10142e311481f11 +size 436593051 diff --git a/full_models/jam/config.json b/full_models/jam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jam/vocab.txt b/full_models/jam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..85323e9eda8e22c7e6fda65d44a5771d06fda0d7 --- /dev/null +++ b/full_models/jam/vocab.txt @@ -0,0 +1,29 @@ +| +i +a +n +d +e +u +m +o +s +t +w +l +k +p +g +r +f +b +h +v +y +z +j +c +— +- +' + diff --git a/full_models/jav/D_100000.pth b/full_models/jav/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d8daf7e1647f2c825c43c566fe50fd952aed210 --- /dev/null +++ b/full_models/jav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e358a7df3ad63ad45c4462739b9a8eed6a9945cecf4bd345520208c78e6d837 +size 561079102 diff --git a/full_models/jav/G_100000.pth b/full_models/jav/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9cc7e92c53f52357a23d9f091b5621d23869cea5 --- /dev/null +++ b/full_models/jav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d875f17cbfa6520935c3255664fcda13a081f1b6bfceac126377691e14c83fcc +size 436354616 diff --git a/full_models/jav/config.json b/full_models/jav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jav/vocab.txt b/full_models/jav/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..458b746b96e70268ade598d84c5668f74d318748 --- /dev/null +++ b/full_models/jav/vocab.txt @@ -0,0 +1,26 @@ +a +| +n +g +i +e +k +u +s +r +t +p +m +l +d +h +o +w +b +y +j +- +c +f +z + diff --git a/full_models/jbu/D_100000.pth b/full_models/jbu/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..58d546866220d072cd707ca299b4195cf17ae1a4 --- /dev/null +++ b/full_models/jbu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a09cb80676fbad84a9783027cedac33388d249b1f0cfd63cf27d8d4e68bc32d +size 561078999 diff --git a/full_models/jbu/G_100000.pth b/full_models/jbu/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef8180e2d559c2a202b3bb47ffcd670201190d66 --- /dev/null +++ b/full_models/jbu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c83d3ffb0e529eece32815e4d43cff9108a6b4ae7428d14b14a435fe6996b22 +size 436404197 diff --git a/full_models/jbu/config.json b/full_models/jbu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/jbu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jbu/vocab.txt b/full_models/jbu/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..a4a268d8d3db7e01dee89575dd21ec2d99dd93fd --- /dev/null +++ b/full_models/jbu/vocab.txt @@ -0,0 +1,48 @@ +| +a +n +i +u +b +k +e +d +w +y +o +r +s +m +t +c +j +z +p +h +f +g +à +v +­ +' +í +l +ī +ò +á +ú +ā +ù +è +ì +é +ō +ē +- +̀ +ó +ḿ +ū +q +â + diff --git a/full_models/jen/D_100000.pth b/full_models/jen/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a78d80a7d93961651a134cc21cbb95dcf388d70e --- /dev/null +++ b/full_models/jen/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f859faf0c4a8d1fe50743e86c818528447d01340597789be27649d765a1677fb +size 561076175 diff --git a/full_models/jen/G_100000.pth b/full_models/jen/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5db5e3c58e8b6860af3dad0398af9202c35d943 --- /dev/null +++ b/full_models/jen/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c30e95eccb847431c61aa6657915e837fe01040444c2c2d9c9648c955a3a61 +size 436355535 diff --git a/full_models/jen/config.json b/full_models/jen/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jen/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jen/vocab.txt b/full_models/jen/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c0afe138623030773f10c23b578c1caf29775677 --- /dev/null +++ b/full_models/jen/vocab.txt @@ -0,0 +1,36 @@ +8 +m +ɨ +s +y +t +i +c +r +k +f +_ +z +e +ɛ +̃ +p + +v +b +ã +j +h +g +u +d +l +w +ũ +ɔ +a +ĩ +' +n +o +ə diff --git a/full_models/jic/D_100000.pth b/full_models/jic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e738c5c7d9933894ca05192be0e049b75f4f59c4 --- /dev/null +++ b/full_models/jic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17e6a19f44343489a651f9dce527e9aad316cb9a4553d9d47b997c41890dd5a +size 561108991 diff --git a/full_models/jic/G_100000.pth b/full_models/jic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f319794440ffa6676c2d904faaea4bc6719a0010 --- /dev/null +++ b/full_models/jic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:532662d6873ef74b17fc3c39af0417068ecabe3e8f5979650a200c8c97f13d63 +size 436625078 diff --git a/full_models/jic/config.json b/full_models/jic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jic/vocab.txt b/full_models/jic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..70d8cc0f1cf6dc6e772b6c3f5f2e2cd11f2c0fcc --- /dev/null +++ b/full_models/jic/vocab.txt @@ -0,0 +1,43 @@ +| +a +j +n +s +p +l +i +e +t +u +o +m +c +y +ü +ꞌ +w +á +' +d +v +q +é +r +í +ó +ú +̈ +g +b +— +ǘ +z +f +h +ñ +x +0 +1 +2 +k + diff --git a/full_models/jiv/D_100000.pth b/full_models/jiv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4bf3e6289f0b6de2ebfe4d12725e4d9bee37dc49 --- /dev/null +++ b/full_models/jiv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89d0355ab1f079548f2147aca023e387525ff21ab342a7ce0dceea620f0477d +size 561109996 diff --git a/full_models/jiv/G_100000.pth b/full_models/jiv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..07035659570862a33941b754770e6a08cee7a078 --- /dev/null +++ b/full_models/jiv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e440de2cadb51e569682ddee0885d82d887a0273ce650ca72e1a6766146791d +size 436587668 diff --git a/full_models/jiv/config.json b/full_models/jiv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jiv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jiv/vocab.txt b/full_models/jiv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..52ec18dc835f2cb66f111552d8f7a44e67d2de0c --- /dev/null +++ b/full_models/jiv/vocab.txt @@ -0,0 +1,26 @@ +a +| +i +u +n +t +r +s +m +k +h +e +̱ +j +y +á +c +w +p +í +ṉ +ú +é +ð +- + diff --git a/full_models/jmc/D_100000.pth b/full_models/jmc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c2459b8a3237b1c96999f38135895a99d00f042 --- /dev/null +++ b/full_models/jmc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf68832688004cf51ada524027ad9e9e4aa9bf83a80ba57da39818d3783be0fb +size 561110384 diff --git a/full_models/jmc/G_100000.pth b/full_models/jmc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..258ef9a977d5a57452f39b8f987fe0578208645d --- /dev/null +++ b/full_models/jmc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868e29efa05f8ac2e9563baa94916807e78f4f0199962aea0e02dbcdc0846442 +size 436607080 diff --git a/full_models/jmc/config.json b/full_models/jmc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jmc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jmc/vocab.txt b/full_models/jmc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..650db881a13f93e5d9c408e2c4986fcb7fcc8a7b --- /dev/null +++ b/full_models/jmc/vocab.txt @@ -0,0 +1,33 @@ +a +| +i +n +e +y +k +u +o +m +s +l +w +v +r +d +h +f +t +b +g +- +p +' +z +0 +4 +j +1 +6 +3 +2 + diff --git a/full_models/jmd/D_100000.pth b/full_models/jmd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a113341dd7424a0bc2d3ac34667b9e0b50b3e077 --- /dev/null +++ b/full_models/jmd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ae73539a0842abb261a0848973c23af0cefe3b746f81c3c1f073839fdf9011 +size 561076040 diff --git a/full_models/jmd/G_100000.pth b/full_models/jmd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3e06e3e0d973d44af9b945676a69f830cbdbdd2e --- /dev/null +++ b/full_models/jmd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35631139784ce226a3fffd23cca466ce7917cb50c69368818dbda087abfa5851 +size 436333778 diff --git a/full_models/jmd/config.json b/full_models/jmd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jmd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jmd/vocab.txt b/full_models/jmd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4778f923a690658ce61e24ff42f66273fbd4d351 --- /dev/null +++ b/full_models/jmd/vocab.txt @@ -0,0 +1,27 @@ +o +s +k +i +t +d +p +- +_ +c +w +a +' +u +b +h +g +r +e +j +l +n +z +y + +f +m diff --git a/full_models/jun/D_100000.pth b/full_models/jun/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7a5aa3dcbf31769a6442880f1459126f4b5efb0b --- /dev/null +++ b/full_models/jun/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e39ffc3f890fb5192fabd8178bb58a631cc39eeda76ae70c3c8a023b781511 +size 561078745 diff --git a/full_models/jun/G_100000.pth b/full_models/jun/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e5fadcc8b94ffd0f17e3aeb09e966b41e3223330 --- /dev/null +++ b/full_models/jun/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631c0dbe1e26e25d07c56410ee250b4cd49972f5ce90b8bc9c15e5226115abdc +size 436429282 diff --git a/full_models/jun/config.json b/full_models/jun/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jun/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jun/vocab.txt b/full_models/jun/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5d4342b9a689954fe08c304897983d3a3dbbbc78 --- /dev/null +++ b/full_models/jun/vocab.txt @@ -0,0 +1,59 @@ +ଙ +ଖ +୯ +ୃ +ଁ +ଠ +୩ +ଧ +ଥ +ୟ +ନ +ଚ +ଫ +ଏ +ଂ +ପ +ଓ +ଲ +୫ +ଜ +ଉ +‍ +ଅ +୪ +ୈ +ବ +ଳ +ଟ +ଶ +ର +୬ +ତ +ଞ +ସ +ଷ +୨ +଼ +ି +ମ +' +ୁ + +୦ +- +୧ +୍ +େ +_ +ଗ +ଦ +ହ +ଯ +କ +ଣ +ଇ +ଡ +ା +ୋ +ଆ diff --git a/full_models/juy/D_100000.pth b/full_models/juy/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..705063a20d7ea248057740b895a55ce58d0a8911 --- /dev/null +++ b/full_models/juy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bff242b8d5a9bcc778ebdd82964f5109c479c2924c46aea4849d981fa90a1a7 +size 561076023 diff --git a/full_models/juy/G_100000.pth b/full_models/juy/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..adea51c65eb30c6bb9b842b80152514fc001b959 --- /dev/null +++ b/full_models/juy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da3afbc812016e4ef1768ee6026f0aa7995dd3f7c798a119e3c00a7c301e67f +size 436361277 diff --git a/full_models/juy/config.json b/full_models/juy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/juy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/juy/vocab.txt b/full_models/juy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6960b9bec8705dc0f3e126d87d4e085539b4b680 --- /dev/null +++ b/full_models/juy/vocab.txt @@ -0,0 +1,39 @@ +୍ +| +ନ +ି +େ +ଆ +ଡ +ା +ର +ଜ +ଙ +ତ +ମ +ଲ +ବ +ସ +ଞ +ୟ +ୋ +ୁ +ଅ +କ +ଗ +ପ +ଏ +଼ +ଇ +ୱ +ଣ +ଃ +ଦ +ଓ +ଉ +ଁ +ଟ +ଂ +' +‍ + diff --git a/full_models/jvn/D_100000.pth b/full_models/jvn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..16642330b0bb16e22d747fcb7cea192a5257ad08 --- /dev/null +++ b/full_models/jvn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1479916caa5252b1b71f4d32aab46b8ddf71f51ccff3acb1d65788542f39e8cf +size 561109372 diff --git a/full_models/jvn/G_100000.pth b/full_models/jvn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4be7f6542c13b6368d4ea7a516568115d125846f --- /dev/null +++ b/full_models/jvn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d9a6bb40220e0886dd9ee4f7d6999d7b9b411ae541e5a29a3ee91c44f1ca5b +size 436606857 diff --git a/full_models/jvn/config.json b/full_models/jvn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/jvn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/jvn/vocab.txt b/full_models/jvn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..78d3485eb6181e6d22158d9cfa50ea4d7e72377b --- /dev/null +++ b/full_models/jvn/vocab.txt @@ -0,0 +1,35 @@ +| +a +n +g +k +i +u +s +é +r +t +o +l +e +w +d +m +p +b +è +y +h +j +- +f +v +0 +' +z +8 +1 +2 +5 +6 + diff --git a/full_models/kaa/D_100000.pth b/full_models/kaa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..98c0ee17565262bf5ed4c7de793a3968bcf5f6ef --- /dev/null +++ b/full_models/kaa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33607fac4aa4d2de3d7ecfb9ddef6c2ac8b3868396e2287c192e2f55eca682a3 +size 561110012 diff --git a/full_models/kaa/G_100000.pth b/full_models/kaa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..130e69f483ad482ca3539218c9bb15ec90e1169c --- /dev/null +++ b/full_models/kaa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72108114df01b27d0b0aed51b34bf5da441bfcd08d3100aa0a21ef66af5f43d1 +size 436637029 diff --git a/full_models/kaa/config.json b/full_models/kaa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kaa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kaa/vocab.txt b/full_models/kaa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..18384f1b36dbbee4adaade2379ee0fde1cb858f3 --- /dev/null +++ b/full_models/kaa/vocab.txt @@ -0,0 +1,47 @@ +| +а +е +и +ы +н +л +р +д +с +т +м +б +й +о +ќ +п +у +з +к +ш +њ +ў +ѓ +ж +є +г +ҳ +ү +қ +х +ң +μ +ғ +я +– +ѳ +ә +ө +в +- +ь +ф +ю +э +ц + diff --git a/full_models/kab/D_100000.pth b/full_models/kab/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..419e6b6ba16a6ab97be03dac946d7e63cfc2e5e6 --- /dev/null +++ b/full_models/kab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379c788b72f84f49a6a9cb798a3e862f63e3ba33f0ec3d9ad21ae2f9f7f60d57 +size 561109081 diff --git a/full_models/kab/G_100000.pth b/full_models/kab/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b2af17fa22e32d8d400192551d16e2a58603731 --- /dev/null +++ b/full_models/kab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb8e941f7ebfe48a8133d140480f4e258536b2815ce9de45f6e192a0830ec32 +size 436613530 diff --git a/full_models/kab/config.json b/full_models/kab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kab/vocab.txt b/full_models/kab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5848416cec6922387a63adf3dc83a7f483f1c27a --- /dev/null +++ b/full_models/kab/vocab.txt @@ -0,0 +1,38 @@ +| +a +e +i +n +d +t +l +s +m +r +u +- +y +w +k +ɣ +b +g +ṛ +ɛ +f +q +ḥ +c +z +x +ṭ +ḍ +h +ṣ +ǧ +č +ẓ +j +' +‐ + diff --git a/full_models/kac/D_100000.pth b/full_models/kac/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4ac58e3c3e29581fcc6664a194c7a19eda76bbff --- /dev/null +++ b/full_models/kac/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750ae9d153b406873c64e0a0bf544214d53c6e2972a9faff098750c9750c7a9f +size 561110002 diff --git a/full_models/kac/G_100000.pth b/full_models/kac/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..acf76e2640b35e322406ecf2602c7dc1c4f34f59 --- /dev/null +++ b/full_models/kac/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd0e74e8f041a9b370e6a822b818ce4c3045e518fb2b3f6ff3f76c544fd773a +size 436586464 diff --git a/full_models/kac/config.json b/full_models/kac/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kac/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kac/vocab.txt b/full_models/kac/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0aca77876186ff4ce00e9b3f83d03537852cf09a --- /dev/null +++ b/full_models/kac/vocab.txt @@ -0,0 +1,26 @@ +| +a +n +i +h +g +m +u +t +e +s +w +k +r +d +y +l +p +j +b +o +c +z +- +' + diff --git a/full_models/kak/D_100000.pth b/full_models/kak/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..70f0a09c3b58d6863d8290c706d4da40aacd1107 --- /dev/null +++ b/full_models/kak/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3d7f51f4190dd55c8f288d20b43d28981e3231f54d3ff7597c9157615387bc +size 561078491 diff --git a/full_models/kak/G_100000.pth b/full_models/kak/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..18060b4d835adcd56502a271dde889b170cd2a70 --- /dev/null +++ b/full_models/kak/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3db1b5c18bef17426a72bf2e98cb4d394cffdf1822b29291de24eebb65ebe2 +size 436368959 diff --git a/full_models/kak/config.json b/full_models/kak/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kak/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kak/vocab.txt b/full_models/kak/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..caf6b64c84c09df35de27f3a40f1c73cebd0b3a2 --- /dev/null +++ b/full_models/kak/vocab.txt @@ -0,0 +1,34 @@ +x +a +v +k +b +_ +c +o +y +r +q +' +p +i +e +d +l +t +ñ +â +w +6 +g + +j +m +h +z +1 +f +u +s +- +n diff --git a/full_models/kan/D_100000.pth b/full_models/kan/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f26c0785417a8771656966ee40ab2081655a4ad --- /dev/null +++ b/full_models/kan/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f67cc5123600a20fc5146f7bac86f3dd49892beccc20f251df0563a5109b04 +size 561110493 diff --git a/full_models/kan/G_100000.pth b/full_models/kan/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..731b363a96c56079268a253569e615be7f8fb388 --- /dev/null +++ b/full_models/kan/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e1ddd60f7ad8e7a91d068059bdcd45a4c4f878ff1c19564fbf3e611568fd2e +size 436704808 diff --git a/full_models/kan/config.json b/full_models/kan/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kan/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kan/vocab.txt b/full_models/kan/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..4cf3f10b9032d0b37c1d699646f5a88b81da7526 --- /dev/null +++ b/full_models/kan/vocab.txt @@ -0,0 +1,75 @@ +' +ಓ +ಮ +ಆ +ಭ +ಋ +ಚ +ಟ +ು +ೇ +ಜ +ಏ +ಾ +ಪ +ಶ +್ +ಈ +ಔ +ಞ +1 +ನ +ಎ +ಸ +ವ +ಇ +ಘ +5 +ಊ +ಳ +ಖ +ೃ +ೆ +- +ತ +ಝ +ಢ + +ಅ +ಧ +ೌ +ಹ +ಯ +9 +ಫ +ಛ +8 +6 +ಲ +ಣ +_ +ದ +ಬ +ಠ +ಡ +ಃ +3 +ೋ +ಂ +ಒ +ೀ +ಕ +ಿ +ಥ +ರ +ೂ +ಐ +ೈ +ಉ +2 +0 +ಗ +ೊ +ಷ +4 +7 diff --git a/full_models/kao/D_100000.pth b/full_models/kao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3aa87d5411508130c0ac38e6c0d025095d599ec --- /dev/null +++ b/full_models/kao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ec8955bf3f41f7d5b1428143517233b6c4b8763dc576b82ab307b629fafe5d +size 561109715 diff --git a/full_models/kao/G_100000.pth b/full_models/kao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e1c36e06c24a6605cc93fa07d42b6a47ec21c749 --- /dev/null +++ b/full_models/kao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18463f98b0b6f6aa305f4313faa35dc58d6f63bc12799debacfd1ce916619dc +size 436599975 diff --git a/full_models/kao/config.json b/full_models/kao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kao/vocab.txt b/full_models/kao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4515cd955f2f734e9ae951874c79c062dfa8f71a --- /dev/null +++ b/full_models/kao/vocab.txt @@ -0,0 +1,32 @@ +| +a +n +o +i +l +e +u +x +t +m +b +s +k +d +w +r +f +y +ɲ +' +g +ŋ +j +í +ń +h +p +é +c +­ + diff --git a/full_models/kaq/D_100000.pth b/full_models/kaq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2d4d2b2e7c54b0ebd350438cd4e5efdbc7f8203e --- /dev/null +++ b/full_models/kaq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9765ac78c7c36168e77364988df5ecadd9f95957be31a1d546f4bda012b00d +size 561078710 diff --git a/full_models/kaq/G_100000.pth b/full_models/kaq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1187a01e820c732490b14d3eb65883e87eb25175 --- /dev/null +++ b/full_models/kaq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2eb87279b3544d70ee218b5872ad00bd36119469a8dced293193e174ae52e0e +size 436370964 diff --git a/full_models/kaq/config.json b/full_models/kaq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kaq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kaq/vocab.txt b/full_models/kaq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4b9d0c0ed9404b25139c5f6506a7eb60fc99078 --- /dev/null +++ b/full_models/kaq/vocab.txt @@ -0,0 +1,34 @@ +x +ú +l +g +k +p +t +ó +f +_ +u +b +— +n +v +c +j +z +d +q + +o +í +h +y +a +ñ +s +i +m +á +é +r +e diff --git a/full_models/kay/D_100000.pth b/full_models/kay/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c46d274a0ad55847b13fbd21b03f156d4c145dac --- /dev/null +++ b/full_models/kay/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620b83907275f0b945472ffe192ad69cde0a144972a615fc2a9af5b3d010c4c4 +size 561076077 diff --git a/full_models/kay/G_100000.pth b/full_models/kay/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2c2b69666332056b57f525f2d576b88af1bbbae --- /dev/null +++ b/full_models/kay/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7767d57ec59a338b48fdf187964b3d62dd0898aabaa76210e2b96f8e21f9101 +size 436376005 diff --git a/full_models/kay/config.json b/full_models/kay/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kay/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kay/vocab.txt b/full_models/kay/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7d4f587d158786b15f440027df59e5fa67fd2da2 --- /dev/null +++ b/full_models/kay/vocab.txt @@ -0,0 +1,45 @@ +ã +m +ỹ +l +z +f +ẽ +u +n +w +x +ç +ĩ +' +j +t +5 +s +6 +a +c +1 +9 +— +õ +ũ +e +_ +k +d +v +y +2 +p +0 +h +i +b +g +7 +3 +o +r +8 + diff --git a/full_models/kaz/D_100000.pth b/full_models/kaz/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ee1598605cf4ab1d5f111269a228a117be9a3b5 --- /dev/null +++ b/full_models/kaz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d33eb3dee600848d54fabe640e895ff96b93b3b0e3a5088952467d932ccb439 +size 561079120 diff --git a/full_models/kaz/G_100000.pth b/full_models/kaz/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..17d07769454756483e69bc778c325a1f94c89333 --- /dev/null +++ b/full_models/kaz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a44d437d37859db55689f8043cd77886e4201fba3eae2399384b129dad6abc +size 436394583 diff --git a/full_models/kaz/config.json b/full_models/kaz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kaz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kaz/vocab.txt b/full_models/kaz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6dddc92cc4905f7b3be45d33f1c727287282f562 --- /dev/null +++ b/full_models/kaz/vocab.txt @@ -0,0 +1,43 @@ +р +т +ұ +б +ү +у +ь +- +ю +ы +ш +й +в +_ +к +л +ң +ц +а +м +з +х +ә +һ +щ +е +ж +п +д +— +ф +э +г +қ +і +ғ +и +о + +н +с +я +ө diff --git a/full_models/kbo/D_100000.pth b/full_models/kbo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ab7273e35cc5dc254aa2727f57a0c3e6b3a81fc6 --- /dev/null +++ b/full_models/kbo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64264d09d1154b53972d2067b21b1518d209823703f5e1c3caab859fc41632d +size 561078845 diff --git a/full_models/kbo/G_100000.pth b/full_models/kbo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..86b8ac8b6e219b76d106c284f7682d17b14fce31 --- /dev/null +++ b/full_models/kbo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba57a441b00282ec57d5e894732a89e1ff291bb92440608538c3b2b0a69b8f5 +size 436408221 diff --git a/full_models/kbo/config.json b/full_models/kbo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kbo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kbo/vocab.txt b/full_models/kbo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c54deae389d009f6406c2ce28beba272efcd90b7 --- /dev/null +++ b/full_models/kbo/vocab.txt @@ -0,0 +1,50 @@ +s +t +i +ẽ +̃ +ị +ụ +o +g +u +m +l +ô +a +ọ +â + +́ +h +̂ +í +k +á +ꞌ +d +b +é +ũ +j +ộ +z +ĩ +p +ŋ +î +n +õ +_ +ã +e +f +v +y +' +c +ẹ +w +ú +r +ó diff --git a/full_models/kbp/D_100000.pth b/full_models/kbp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b84d9752add1cb2dee16615a878b27ba0b2a34e8 --- /dev/null +++ b/full_models/kbp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:477d01aa2de842d15039ffc472f5996b39a93ff0c9033f7636de3f39ee1401c3 +size 561079363 diff --git a/full_models/kbp/G_100000.pth b/full_models/kbp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a518bcf5d046a6268dee764b704b8332d436dbff --- /dev/null +++ b/full_models/kbp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1142d9c939d4af15fd38c8fe8e582bd672aa1ef95837b9e3810bb07d6451f53e +size 436395196 diff --git a/full_models/kbp/config.json b/full_models/kbp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kbp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kbp/vocab.txt b/full_models/kbp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9a3f6c515c050ecf2caab4acbe3630d960885b7d --- /dev/null +++ b/full_models/kbp/vocab.txt @@ -0,0 +1,43 @@ + +f +ɖ +é +z +t +- +i +ó +b +ɛ +n +e +k +m +ḿ +c +́ +g +ñ +đ +ú +ʋ +v +h +p +u +o +ń +j +y +l +a +ɣ +ɔ +r +á +ɩ +_ +w +ŋ +s +d diff --git a/full_models/kbq/D_100000.pth b/full_models/kbq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d5623272058c66f8219ebe2092840bc459c2580 --- /dev/null +++ b/full_models/kbq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793cef0941443f292884fc378e1e302c6760032b0820ab5570bd4e6a64e8945d +size 561078986 diff --git a/full_models/kbq/G_100000.pth b/full_models/kbq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1382f52897118cf05d1c3308aad5cb8d599d8f38 --- /dev/null +++ b/full_models/kbq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f4faf7f7e4803b93299169ab205ebeb28dbbc6f6b6a255bfde74624bd6dcc4 +size 436384104 diff --git a/full_models/kbq/config.json b/full_models/kbq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kbq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kbq/vocab.txt b/full_models/kbq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..87ae524b301917c1ee61be92a87202a2443c7dbe --- /dev/null +++ b/full_models/kbq/vocab.txt @@ -0,0 +1,39 @@ +u +8 +0 +v +m +f + +l +7 +1 +2 +y +_ +4 +h +g +p +- +d +e +a +3 +5 +q +i +b +6 +t +z +o +' +k +w +s +9 +x +r +n +j diff --git a/full_models/kbr/D_100000.pth b/full_models/kbr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87614f89ce45e1ffa3d0494c4f1cf6dd6c4788c1 --- /dev/null +++ b/full_models/kbr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f8cee097e86daef3c236c3494963c81aa3da50460ed4a979ac4b59feb395da +size 561109849 diff --git a/full_models/kbr/G_100000.pth b/full_models/kbr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cc9d90fcf4ca58fcd9314fc32c7dd49baeb044ff --- /dev/null +++ b/full_models/kbr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5932ff7a807459c9e9b522ca8465e2f78757984ac94952af973d87f4ba50685 +size 436599994 diff --git a/full_models/kbr/config.json b/full_models/kbr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kbr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kbr/vocab.txt b/full_models/kbr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5a530570ed9fca04e54418d3dbd2664217e42771 --- /dev/null +++ b/full_models/kbr/vocab.txt @@ -0,0 +1,32 @@ +| +o +a +i +e +n +h +t +b +c +y +s +m +u +l +g +k +r +q +d +' +w +x +f +j +p +- +z +6 +1 +4 + diff --git a/full_models/kby/D_100000.pth b/full_models/kby/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e47bd1f435f4ef3104cefa94b308d0d443a743d --- /dev/null +++ b/full_models/kby/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8267af64b74a48ad386198cc41e45b269e715e31b0cb2b2b981948875b581854 +size 561076841 diff --git a/full_models/kby/G_100000.pth b/full_models/kby/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..806b9c44f09e305b7659ce833f5d9c263ea39ac3 --- /dev/null +++ b/full_models/kby/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e02d685084d6bc1dae0fe74f6a5662c41c83276fc0b5661fd9f11bbf08f9df4 +size 436359756 diff --git a/full_models/kby/config.json b/full_models/kby/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kby/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kby/vocab.txt b/full_models/kby/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..de3ff4e8603af8f37b640d17fe0e1f1aae009aac --- /dev/null +++ b/full_models/kby/vocab.txt @@ -0,0 +1,30 @@ +w +t +h +s +n +j +k +p +y +f +l +e +o +_ +m +a +g +- +b +' +3 +u +4 +i +r +ǝ +ɍ +c +d + diff --git a/full_models/kca/D_100000.pth b/full_models/kca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d91212d4fb87268031146168012717b2603187d1 --- /dev/null +++ b/full_models/kca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df2531b619a9613e28f5eb211d3d24d0b44c4b66652d7937b13efefa1dfd3c6 +size 561076065 diff --git a/full_models/kca/G_100000.pth b/full_models/kca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b9b3cc328f39306c561f290989dd73dbe5385a0 --- /dev/null +++ b/full_models/kca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be196035d2df74f13482bef1367a62f22b2a017c7d633cbbad33a0829a6f79d +size 436378179 diff --git a/full_models/kca/config.json b/full_models/kca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kca/vocab.txt b/full_models/kca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2b6be3f22fb80dfef2a5077a5d98e67616fae3d8 --- /dev/null +++ b/full_models/kca/vocab.txt @@ -0,0 +1,46 @@ +ц +– +' +ч +к +м +з +ӑ +ә +ԓ +с +п +ш +в +е +ă +ў +ԋ +т +ы +х +ŏ +р +ӈ + +- +г +_ +у +ԉ +ԏ +о +и +й +д +н +э +ф +ь +ё +ю +л +я +а +щ +б diff --git a/full_models/kcg/D_100000.pth b/full_models/kcg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b74991b62f002b806f1cccd013ba92949b4d7c51 --- /dev/null +++ b/full_models/kcg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8105f778620b06a45d1d776895ebb47929239c3f72d708e02722cecc2306c9ed +size 561078607 diff --git a/full_models/kcg/G_100000.pth b/full_models/kcg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c76adba59974bd1e702b69fdb1beefbd973ad542 --- /dev/null +++ b/full_models/kcg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ace552497f11c5290fef73eb8ae988140c3b96d1efdacc0df8ca2825a4f402e2 +size 436368840 diff --git a/full_models/kcg/config.json b/full_models/kcg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kcg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kcg/vocab.txt b/full_models/kcg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..09936a28e32e8bf8bb1b54abad233a270acb4ad7 --- /dev/null +++ b/full_models/kcg/vocab.txt @@ -0,0 +1,34 @@ +á +_ +í +y +ó +a +v +̱ +o +w +z +n +g +k +d +j +i +s +t +ú +r +' +p +l +é +m +f + +h +b +u +e +- +c diff --git a/full_models/kdc/D_100000.pth b/full_models/kdc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..11e5c4f280661b2a0ea1e474f745169e34041cc2 --- /dev/null +++ b/full_models/kdc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a285f3ef2d0fc8bd3428219542fb2b25e158ae09b16ec1b481a2d98efd14ddf +size 561079007 diff --git a/full_models/kdc/G_100000.pth b/full_models/kdc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cac778e1459d45c05d6aa58cfd2d8f38d7880d02 --- /dev/null +++ b/full_models/kdc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b0771d0ec8890eb1a95c6fea3482a9e75939186fb2b06a87e738622b252bc4d +size 436354465 diff --git a/full_models/kdc/config.json b/full_models/kdc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdc/vocab.txt b/full_models/kdc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86a8d34e0dcf24a9cc5d1b72ca491cd66cff2193 --- /dev/null +++ b/full_models/kdc/vocab.txt @@ -0,0 +1,26 @@ +l +f +c +m +s +p +e +o +i +u +v +h +a +' +z +d +g +w + +k +b +j +t +n +y +_ diff --git a/full_models/kde/D_100000.pth b/full_models/kde/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb8e313fb62d76fae123b18a22e326d5794c6835 --- /dev/null +++ b/full_models/kde/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a41ed53ae71cd04c73926257e521ccb050f7c32584903ed9a333e2841f25c7 +size 561079118 diff --git a/full_models/kde/G_100000.pth b/full_models/kde/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..033af9a421cf6b64e13ba3c0713c8e56c06022b5 --- /dev/null +++ b/full_models/kde/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8169e4cacb3041269d8b8d6a6e2baa841984a87c2bd1e5a52b894a2c3f0903 +size 436370528 diff --git a/full_models/kde/config.json b/full_models/kde/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kde/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kde/vocab.txt b/full_models/kde/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..498a19a2b01b566d3e37f39d0abdd9b4b7414959 --- /dev/null +++ b/full_models/kde/vocab.txt @@ -0,0 +1,33 @@ +í +w +g +è +e +y +d +a +l + +u +_ +o +h +ó +k +j +á +s +i +ù +' +ú +b +p +- +t +m +ì +à +é +v +n diff --git a/full_models/kdh/D_100000.pth b/full_models/kdh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3d067fa65d39aaf7583add79e1bc32f84319c6f4 --- /dev/null +++ b/full_models/kdh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abadba6d151e105b77ca32856e7e18af4dea6840669b8d6db2ec8b1404d5f845 +size 561078852 diff --git a/full_models/kdh/G_100000.pth b/full_models/kdh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ab8e3f5bb2f7382a6d90e25c7f61cece4c32cf2d --- /dev/null +++ b/full_models/kdh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b645099acf6e26acede1f2fe460ac7df69e7a00950f88ef235c18cc8c521e7b +size 436395414 diff --git a/full_models/kdh/config.json b/full_models/kdh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/kdh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdh/vocab.txt b/full_models/kdh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..87c37d9e7b6fdd8eb1669b18779ad75bcf5cb247 --- /dev/null +++ b/full_models/kdh/vocab.txt @@ -0,0 +1,43 @@ +| +ɩ +́ +a +ɛ +n +á +ɔ +b +s +m +w +d +l +ʊ +k +r +e +ɖ +t +y +g +í +i +z +o +- +é +ú +u +ŋ +v +ń +f +j +ó +c +ḿ +p +h +‐ +ÿ + diff --git a/full_models/kdi/D_100000.pth b/full_models/kdi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fb9e8d2e3866cfb049e91c660478b81f090a9544 --- /dev/null +++ b/full_models/kdi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d94a331c90ac0c5c4597e835d822eff4a6a5f0f70e8be52d66ab74f694899ad2 +size 561110014 diff --git a/full_models/kdi/G_100000.pth b/full_models/kdi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..27a38fc163e79c14bb51e7b40b25cd886df0415b --- /dev/null +++ b/full_models/kdi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf88eff8a13580b2911cdd8b84898f4940fa12b661187eedb371e1e9f563cb2 +size 436590777 diff --git a/full_models/kdi/config.json b/full_models/kdi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdi/vocab.txt b/full_models/kdi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..95748e8fab4c0d7d3aa2230a2ecdef99c5e054f9 --- /dev/null +++ b/full_models/kdi/vocab.txt @@ -0,0 +1,27 @@ +| +o +e +a +i +k +n +m +d +u +t +g +r +b +w +l +y +p +c +s +j +' +4 +3 +0 +- + diff --git a/full_models/kdj/D_100000.pth b/full_models/kdj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23c83989e80882f7503b508f0e770e44f6709ec9 --- /dev/null +++ b/full_models/kdj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f61be138fa66ffac46cd24c3354cd9d7f92a36342c0a443ea368a165eccfd839 +size 561110135 diff --git a/full_models/kdj/G_100000.pth b/full_models/kdj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91bd5745c9223d068c2fcad7ed2323086c254b78 --- /dev/null +++ b/full_models/kdj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b3c6a19c06b846dd50a33ed92c7df800eac3f478a8b8ca7e5f50a844157c7e6 +size 436590365 diff --git a/full_models/kdj/config.json b/full_models/kdj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdj/vocab.txt b/full_models/kdj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3d0d77612e92df5fa86f4e214869d67cb0cf8949 --- /dev/null +++ b/full_models/kdj/vocab.txt @@ -0,0 +1,26 @@ +| +a +i +e +o +k +n +ŋ +u +t +r +l +y +s +m +p +d +b +w +c +j +g +– +- +' + diff --git a/full_models/kdl/D_100000.pth b/full_models/kdl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c82ea42a44c20695de649d2d9ce301a5ba0e6f58 --- /dev/null +++ b/full_models/kdl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ce2483df158673db098d7473f3de6b1696238fb30f0090382ee04c0795172c +size 561078633 diff --git a/full_models/kdl/G_100000.pth b/full_models/kdl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2cbdb8ea176d2454d2b2c741ea2e45947d2879ad --- /dev/null +++ b/full_models/kdl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222bd7a9e3f59762b2f8fbfab5f08023fa9fa51dd886e556de573114d35f06a1 +size 436366645 diff --git a/full_models/kdl/config.json b/full_models/kdl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdl/vocab.txt b/full_models/kdl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5b7193a1b8679fc91319887ba563471efde926ee --- /dev/null +++ b/full_models/kdl/vocab.txt @@ -0,0 +1,33 @@ +| +a +u +i +n +k +̱ +s +t +e +m +y +o +l +w +g +r +h +ɗ +b +p +v +c +d +z +ꞌ +ɓ +f +j +‐ +- +' + diff --git a/full_models/kdn/D_100000.pth b/full_models/kdn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7c1bb4c5461e1e24f216bcd2f441595368c31bc --- /dev/null +++ b/full_models/kdn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150cf674eb8e2ab45d94e80b31721e3d19aae3f3f46bfbe7f6d4d844cf06b35b +size 561109883 diff --git a/full_models/kdn/G_100000.pth b/full_models/kdn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..343e59b3c59f8a25366a888df8aeb90b847a5dc1 --- /dev/null +++ b/full_models/kdn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8eda042a17ade4e99d4007e81240baa6713435a94ae450a64f5bbe26912b63 +size 436593058 diff --git a/full_models/kdn/config.json b/full_models/kdn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdn/vocab.txt b/full_models/kdn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d022b7723190e7d5d304d5490ea1e137bb7c6193 --- /dev/null +++ b/full_models/kdn/vocab.txt @@ -0,0 +1,29 @@ +a +| +i +u +n +k +e +m +l +d +o +w +t +h +z +y +p +s +b +g +v +c +f +j +r +- +' +– + diff --git a/full_models/kdt/D_100000.pth b/full_models/kdt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..891bbfe1f01df4b50eaa4e206105045257710f3d --- /dev/null +++ b/full_models/kdt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1c4c99ee4d6429a26c95074cc7631af29ecc76f8fee2d3b195524cfa04d5b9 +size 561078857 diff --git a/full_models/kdt/G_100000.pth b/full_models/kdt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ea0056caf5bc10abf8bd42c4d62411f5627dec0c --- /dev/null +++ b/full_models/kdt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98cbba97e0bd9701fda8bad1459ef73b0b489d84ab2572800e27a9d78669488 +size 436434720 diff --git a/full_models/kdt/config.json b/full_models/kdt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kdt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kdt/vocab.txt b/full_models/kdt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fba93360a3aee98379d68172be09c88e369dcdbf --- /dev/null +++ b/full_models/kdt/vocab.txt @@ -0,0 +1,61 @@ +៉ +ី +ះ +ង +ថ +ភ +ដ +ផ +ឹ +ខ +ូ +- +ញ +យ +ិ +ណ +រ +អ +ឱ +ៅ +ឋ +ែ +ា +ឥ +ល +ម +ឌ + +ឡ +េ +ស +ំ +្ +ព +ហ +គ +ួ +័ +ទ +ៃ +ឃ +ឿ +ុ +ន +៊ +៍ +ក +វ +ឆ +ោ +ើ +ជ +ឈ +់ +_ +ច +ៀ +ធ +ឺ +ត +ប diff --git a/full_models/kek/D_100000.pth b/full_models/kek/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..225cd0834bed867aa2b33ed585c736347702ab16 --- /dev/null +++ b/full_models/kek/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f711e2d3fc3fc0dfa2c8df4b9b99450e9cbaaa88fca34571f49d612076e581d4 +size 561109965 diff --git a/full_models/kek/G_100000.pth b/full_models/kek/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f67286f647333a88f638cfd6be2a02fd296c4452 --- /dev/null +++ b/full_models/kek/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3b78c9cb2dde19c6bca20602eb87d424a309aac5ba93bac1916252d232bb55 +size 436611243 diff --git a/full_models/kek/config.json b/full_models/kek/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kek/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kek/vocab.txt b/full_models/kek/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ec1053e48d0ec10c33e29d013897fdc1a3a4f4f7 --- /dev/null +++ b/full_models/kek/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +u +c +l +n +' +e +t +̱ +b +x +o +h +k +r +j +s +q +m +y +d +p +z +— +- +ú +í +g +ó +é +f +á +v +ñ + diff --git a/full_models/ken/D_100000.pth b/full_models/ken/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cb6b4793a1c0b185750453f6cc367f00c81d45eb --- /dev/null +++ b/full_models/ken/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abbceef015de760d804bcf978df394509a791aca91f8801a7336a57df81a42fd +size 561109975 diff --git a/full_models/ken/G_100000.pth b/full_models/ken/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5569ed79bb7c0acc4ac71932b2fb93b94fd82941 --- /dev/null +++ b/full_models/ken/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:271e8c80feb3feb410de1f0bc3cf3e15b96da10a9fa863c293fe1e31f36b2f5f +size 436645797 diff --git a/full_models/ken/config.json b/full_models/ken/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ken/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ken/vocab.txt b/full_models/ken/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ed645458219c8cb20f8600307fedaf28f5133d16 --- /dev/null +++ b/full_models/ken/vocab.txt @@ -0,0 +1,51 @@ +| +ɛ +n +b +a +m +k +́ +ɔ +h +y +t +á +ɨ +i +ŋ +s +r +p +c +d +o +u +w +í +ʉ +̌ +g +e +f +ǎ +ǔ +ó +ú +̀ +l +ǒ +é +j +à +ě +ò +ǐ +- +ù +ì +' +è +v +ń + diff --git a/full_models/keo/D_100000.pth b/full_models/keo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..54a9e849ce7f7b6eb24f41a2918e8c4aa388caad --- /dev/null +++ b/full_models/keo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd88fee03b51f5aec3578c82c6f5185b67cd17c2f559c143215a6ba93283828b +size 561110236 diff --git a/full_models/keo/G_100000.pth b/full_models/keo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0a3d5961218e6af8e86cc53dd0d7f5663562c34 --- /dev/null +++ b/full_models/keo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac7889c528d8d9d1b4471dcff57138bc2dbe5ec29e8e92b2fdf4097b8aece0c +size 436594787 diff --git a/full_models/keo/config.json b/full_models/keo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/keo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/keo/vocab.txt b/full_models/keo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8a2f396e0be32d82ee38af36c3dd37002ac19b95 --- /dev/null +++ b/full_models/keo/vocab.txt @@ -0,0 +1,28 @@ +| +a +i +u +o +k +n +e +l +r +d +t +g +y +b +ŋ +m +p +s +' +z +w +h +f +v +­ +— + diff --git a/full_models/ker/D_100000.pth b/full_models/ker/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f2183d3e3fe505dad8e0e6161e1bd231820e06b --- /dev/null +++ b/full_models/ker/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e29696dca45a55ca820c5d1ebaf30ad76947d974cd791e5d344cb37cae7c282 +size 561109747 diff --git a/full_models/ker/G_100000.pth b/full_models/ker/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1e2ad6d4946d56c68bc8bd86009cdbffd45daebd --- /dev/null +++ b/full_models/ker/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db6bfd9fb201b916c919e5b7a60c69a381c38e576fe9e9bd65ea922e6d061c8 +size 436646021 diff --git a/full_models/ker/config.json b/full_models/ker/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ker/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ker/vocab.txt b/full_models/ker/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e800de3a36ce7f8993ce384fae4aa77bc8712a73 --- /dev/null +++ b/full_models/ker/vocab.txt @@ -0,0 +1,52 @@ +| +a +ə +i +e +ŋ +k +n +m +t +u +r +d +b +l +o +w +s +g +y +p +h +ɗ +j +c +f +- +z +á +ɓ +' +v +ã +ó +é +õ +ẽ +ú +̃ +– +1 +0 +2 +3 +4 +5 +6 +7 +í +8 +9 + diff --git a/full_models/key/D_100000.pth b/full_models/key/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1ad93100cef465fdd9c5a9b6cd0528cd3226a836 --- /dev/null +++ b/full_models/key/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daef34d66942a8e062fd48c11b5a9d6ef7fcda9caab4608097eb49af044fdf72 +size 561078978 diff --git a/full_models/key/G_100000.pth b/full_models/key/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20bdfbc8cd5ccaa3046f99a099a5e0312b22b6f8 --- /dev/null +++ b/full_models/key/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3618f30eac0d5e7e6f5e02506b7dab13592006a5c25c1eb4f66a05bda528f368 +size 436415134 diff --git a/full_models/key/config.json b/full_models/key/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/key/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/key/vocab.txt b/full_models/key/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..52304e5c1db7ff627716dcfb7a0105f0d75aa2ee --- /dev/null +++ b/full_models/key/vocab.txt @@ -0,0 +1,53 @@ +ఐ +ఙ +ీ +జ +శ +_ +త +క +చ +ె +వ +ఊ +స +‍ +ఁ +- +ష +ద +ప +గ +ఓ +ఈ +న +ఔ +ే +' +ల +ో +ం +ర +ఎ +బ +ఏ +ఆ +ు +ూ +ఫ +ౌ +ై +ఉ +ొ +ా +అ +య +హ +డ +ఇ +ఒ +మ +్ +ట + +ి diff --git a/full_models/kez/D_100000.pth b/full_models/kez/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9a9c1b222772dbc3e608f020be723c88f2e8b75 --- /dev/null +++ b/full_models/kez/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19dc29f02dc48e1c3e2837856de70ec9444dd973859f22bbd63d8f54f594049e +size 561109972 diff --git a/full_models/kez/G_100000.pth b/full_models/kez/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e68eb29b95db7c95e6d44e61e06cbf4714609833 --- /dev/null +++ b/full_models/kez/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dba590425ce2c766e6224a7e6b664c4cdd16e5991c226f6a55d1c273b0cc44c2 +size 436641439 diff --git a/full_models/kez/config.json b/full_models/kez/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kez/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kez/vocab.txt b/full_models/kez/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7dcaeb6e34d74878bbf68c4b1c351899faceb4c6 --- /dev/null +++ b/full_models/kez/vocab.txt @@ -0,0 +1,50 @@ +| +a +ɔ +n +ɛ +k +l +b +t +g +i +m +u +e +y +s +w +p +o +z +f +d +v +- +̀ +j +r +h +c +́ +à +á +' +x +é +ú +ù +ì +è +q +– +0 +6 +— +í +ǹ +5 +ɜ +ń + diff --git a/full_models/kfb/D_100000.pth b/full_models/kfb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c7fa9ebdb97c109e5a79e47cc7bc67222267e272 --- /dev/null +++ b/full_models/kfb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93cc63aab6418f6d414fb403c86f4f221174927834b6e10aab486d215612d5e +size 561110250 diff --git a/full_models/kfb/G_100000.pth b/full_models/kfb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fd71e4d839bae24bdf24f08aad340674a302f653 --- /dev/null +++ b/full_models/kfb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e6365b1dec739799938da17aa63e4c81e03341d43ade0cb526c1c2f2e440d4 +size 436644416 diff --git a/full_models/kfb/config.json b/full_models/kfb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kfb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kfb/vocab.txt b/full_models/kfb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3bc57f979803102a70cf5b63e47674f25b89b460 --- /dev/null +++ b/full_models/kfb/vocab.txt @@ -0,0 +1,50 @@ +| +ा +न +् +े +त +क +ी +र +द +ु +‍ +म +आ +ग +ं +ल +स +व +प +ो +ट +य +ि +इ +ड +ळ +ए +ब +ज +ओ +श +ू +ई +उ +च +ै +अ +ौ +ऊ +' +ृ +- +० +४ +१ +६ +२ +७ + diff --git a/full_models/kff-script_telugu/D_100000.pth b/full_models/kff-script_telugu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0882228a9e92548483a04bd8a87f242b45785de8 --- /dev/null +++ b/full_models/kff-script_telugu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe7b6a684cd43e41ecfca976c15e6b5da7db742ad8ee26d92bcfe84a7427441 +size 561077999 diff --git a/full_models/kff-script_telugu/G_100000.pth b/full_models/kff-script_telugu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a66ce9697b6c17d9ff62fc7bda5904f6eea51ed --- /dev/null +++ b/full_models/kff-script_telugu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f609bc5347a588c0c88b12d8d4d2be4cf2137da93dea566636d67bfa4431ba2 +size 436381565 diff --git a/full_models/kff-script_telugu/config.json b/full_models/kff-script_telugu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kff-script_telugu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kff-script_telugu/vocab.txt b/full_models/kff-script_telugu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc9214d7b43ca64c99bba4ba7c963d80c40031bd --- /dev/null +++ b/full_models/kff-script_telugu/vocab.txt @@ -0,0 +1,41 @@ +| +ి +న +్ +ు +త +ా +క +ర +ం +ె +మ +ద +స +ో +గ +ప +ల +ట +వ +డ +య +ే +బ +ొ +జ +ఓ +అ +ీ +ఇ +చ +ఆ +ూ +ఈ +ఒ +ఊ +ఏ +ఎ +ఉ +- + diff --git a/full_models/kfw/D_100000.pth b/full_models/kfw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6ecaf1a1c88fe133a3f2b1a353f187f5e4594f5f --- /dev/null +++ b/full_models/kfw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faa6417ea7f298b5ef6ad039bf83885d206453b9defb1b44cac31049b46a168b +size 561078625 diff --git a/full_models/kfw/G_100000.pth b/full_models/kfw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9c18cbdf69d080f53c65c28f7f17b55630bad178 --- /dev/null +++ b/full_models/kfw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab978d617aa503c439578b86134227709a536903d5318d48d4caac51a3ce0f8 +size 436392154 diff --git a/full_models/kfw/config.json b/full_models/kfw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kfw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kfw/vocab.txt b/full_models/kfw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..15b0dd54bc3f8d1d97dadffee56811c5c3f31580 --- /dev/null +++ b/full_models/kfw/vocab.txt @@ -0,0 +1,43 @@ +t +_ +l +z +– +2 +x +­ +p +— +7 +i +6 +k +d +a +y +o +' +w +c +r +v +n +0 +9 +b +u +q +f +j +m +- +8 +5 +e +4 + +g +1 +h +3 +s diff --git a/full_models/kfx/D_100000.pth b/full_models/kfx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5dae31058fb9848b0ade08313dec5556f4bc43d0 --- /dev/null +++ b/full_models/kfx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06141412cc34e8b7be4e9858d1fdd5374ebb7675437c9d1968d7b51ab00c55bf +size 561078605 diff --git a/full_models/kfx/G_100000.pth b/full_models/kfx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ba3348e2125d8205df9a0ed0a3955b2329cfd87b --- /dev/null +++ b/full_models/kfx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a102f55a5330d4e90def3c4656a12305edd2121ca446553b88f056b3835937d +size 436440679 diff --git a/full_models/kfx/config.json b/full_models/kfx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kfx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kfx/vocab.txt b/full_models/kfx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..33edd777698e4539007be21ef1273ba377ce365d --- /dev/null +++ b/full_models/kfx/vocab.txt @@ -0,0 +1,65 @@ +| +ा +ै +र +ी +स +त +ह +क +न +ि +ब +् +े +ो +़ +ु +ं +म +ल +प +ज +ण +द +य +श +आ +ू +ौ +ग +ई +व +भ +ऐ +ँ +ध +च +ख +ड +इ +ऊ +घ +ए +ढ +ट +छ +थ +अ +फ +ठ +झ +ष +- +औ +उ +ऑ +ओ +ः +ञ +ृ +ऋ +' +– +‍ + diff --git a/full_models/khg/D_100000.pth b/full_models/khg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7a8dfe20ece78d76acb8cc5d1ec57d91c9c25603 --- /dev/null +++ b/full_models/khg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c68ad01b65006d8b229d5616f976bca980caff894c54bfb0580bb7e677930f +size 561078983 diff --git a/full_models/khg/G_100000.pth b/full_models/khg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..99c416d7af1484a4b1e9b81fc5718892701afd6e --- /dev/null +++ b/full_models/khg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf48428b247ea5ccdbefeec40c28a9d09eac5f80c6c2aa0435423dac92c5a83 +size 436428853 diff --git a/full_models/khg/config.json b/full_models/khg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/khg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/khg/vocab.txt b/full_models/khg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ee7084a57a2474c49081ae9886549c6627506934 --- /dev/null +++ b/full_models/khg/vocab.txt @@ -0,0 +1,59 @@ +མ +_ +ྱ +ཀ +ཆ +ག +ད +ཨ +ཐ +ྟ +ཤ +ཙ +ྕ +ོ +ྫ +ི +ལ + +ཟ +ྙ +ཡ +ཏ +ཁ +ྤ +ྦ +ང +ྐ +ན +ྭ +ཪ +ུ +ྲ +ྷ +ྒ +ྗ +ཞ +ར +ཅ +ྣ +ླ +པ +ྨ +འ +ྡ +ཱ +ཕ +ཊ +བ +ཉ +ྩ +་ +ཚ +ེ +ས +ཇ +ྔ +ཛ +ཝ +ཧ diff --git a/full_models/khm/D_100000.pth b/full_models/khm/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f1e4abd96907f86712595280756ba5d41b78ed3 --- /dev/null +++ b/full_models/khm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:984ab377966f62d156639d5f2af3edbcac54014f307cd5a500625cb1efa099be +size 561078755 diff --git a/full_models/khm/G_100000.pth b/full_models/khm/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..168761fb62ca0dc3e2ded270c9e66ba6c5249f8f --- /dev/null +++ b/full_models/khm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a7237c6bd72beb885152631e69743290c03b4a33ea17b7c3ca851a29b9749d +size 436464113 diff --git a/full_models/khm/config.json b/full_models/khm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/khm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/khm/vocab.txt b/full_models/khm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1dee5053bc85d9f1ea727781660472da1a42370e --- /dev/null +++ b/full_models/khm/vocab.txt @@ -0,0 +1,74 @@ +្ +យ +អ +ឆ +គ +ង +ើ +ធ +់ +ឃ +ឌ +ឥ +ប +ួ +ឈ +q +៏ +ផ +ិ + +ជ +ឧ +ល +ឱ +ទ +ូ +រ +៎ +ឭ +ា +ៀ +ឿ +េ +ំ +៍ +ត +_ +៉ +ក +ែ +ៅ +ៃ +ដ +វ +ៈ +ឬ +ឫ +ះ +ោ +ី +ុ +ឯ +ព +ឡ +ច +ឋ +ណ +1 +ហ +ន +ឹ +ស +ខ +័ +ញ +៊ +ឮ +៌ +ថ +ឺ +ឪ +- +ម +ភ diff --git a/full_models/khq/D_100000.pth b/full_models/khq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4d53bf8f1a3797aa0ac8a301c05662aac27773e --- /dev/null +++ b/full_models/khq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11434febfe18d4e931d9a19ebd25ea8f3d0ee4a5759fa5b6f30f877713399687 +size 561079477 diff --git a/full_models/khq/G_100000.pth b/full_models/khq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d009c58cd2b9313917528d3e7d95b1cfe230b53 --- /dev/null +++ b/full_models/khq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f42ebd3d597c92b9666b3ae04a8967f4729ca141f56381f3b601b352c71a3bf +size 436380365 diff --git a/full_models/khq/config.json b/full_models/khq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/khq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/khq/vocab.txt b/full_models/khq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d1eb387fa7fcd1cc15a594ab0eb6e4cd5dca639b --- /dev/null +++ b/full_models/khq/vocab.txt @@ -0,0 +1,36 @@ +n +k +– +i +d +' +g +b +z +c +ɲ +j +o +f +r +a +š +ã + +s +t +h +ẽ +l +ŋ +p +ĩ +e +ž +y +_ +- +õ +m +u +w diff --git a/full_models/kia/D_100000.pth b/full_models/kia/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..16b8596400b397491ac47d65ddded518e7f4408d --- /dev/null +++ b/full_models/kia/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca45ad14f016f36939c10a1033eafaaa1077bbcd0fd08d847259aafffe8c2c93 +size 561078872 diff --git a/full_models/kia/G_100000.pth b/full_models/kia/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d8d783abfc0402e115987d2e38ebfd60db5f5198 --- /dev/null +++ b/full_models/kia/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2914eca69e1101bb111e69f3ea518a411c2c47014437790e643c261b3c7f9734 +size 436400974 diff --git a/full_models/kia/config.json b/full_models/kia/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kia/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kia/vocab.txt b/full_models/kia/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f07a6a84df226e5c7f63846fac83db7082dcbed4 --- /dev/null +++ b/full_models/kia/vocab.txt @@ -0,0 +1,46 @@ +à +ɓ +d +f +m +b +z +c +ù +h +n +ɗ +p +á +ó +g +ŋ +ú +k +l +s +v +ò +ḛ +' +y +é +̰ + +u +ṵ +_ +r +ū +́ +ḭ +- +a +w +e +j +í +o +è +i +t diff --git a/full_models/kij/D_100000.pth b/full_models/kij/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdcd5f9f127b5a00ad5c6e1af0c248c97c61980c --- /dev/null +++ b/full_models/kij/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98fa4ac14b9958b047e268aeadee86d7d60dcfe942577a398af23ebfc4e1cd17 +size 561078752 diff --git a/full_models/kij/G_100000.pth b/full_models/kij/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8883066d4c63b00138981e3349aa5474213a93ef --- /dev/null +++ b/full_models/kij/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32776d297004feae2eb34c8689e8e687bad32de38ebcee6f394178277dc88973 +size 436373369 diff --git a/full_models/kij/config.json b/full_models/kij/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kij/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kij/vocab.txt b/full_models/kij/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..608f7650bd3d46f3ee7505d722851db8bb5fc756 --- /dev/null +++ b/full_models/kij/vocab.txt @@ -0,0 +1,35 @@ +i +0 +á +6 +w +y +d +t +é +k +g +s +e +- +_ +1 +p +n +8 +b +r +5 +2 +f + +l +v +o +' +a +` +m +ó +u +4 diff --git a/full_models/kik/D_100000.pth b/full_models/kik/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce6d6c5368650a4c51b680d8b6fa79cfbac217f5 --- /dev/null +++ b/full_models/kik/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed906e211315a684bdc05f91a3029570179072015d4d01822bfe4b44e804ad70 +size 561079479 diff --git a/full_models/kik/G_100000.pth b/full_models/kik/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..99d6b0dd98b71d5c0d95f163ae5a79f113a19367 --- /dev/null +++ b/full_models/kik/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6701df59039309b061afef8ff910b48905d7af8adb1ea71a47bc3d11f2f695e5 +size 436382624 diff --git a/full_models/kik/config.json b/full_models/kik/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kik/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kik/vocab.txt b/full_models/kik/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6b3cc20445e5e9c6c89fa68c750ddb13b484cb3e --- /dev/null +++ b/full_models/kik/vocab.txt @@ -0,0 +1,37 @@ +ũ +t +5 +h +1 +w +a +4 +n +j +ʼ +o +v +i +ĩ +_ +2 +m +k +0 +c +s +e +q +- +p +y +u +g +' + +d +b +r +z +f +l diff --git a/full_models/kin/D_100000.pth b/full_models/kin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2753e661171d44a025005c5a48d780def699ee72 --- /dev/null +++ b/full_models/kin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c2aa9e11f9a770c3cbc15251f59a95de117fbf2e93dd7327d77c61ae66035c +size 561109743 diff --git a/full_models/kin/G_100000.pth b/full_models/kin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3520c872a86908e291248d8dc76e0e47a9f43e2b --- /dev/null +++ b/full_models/kin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef6d182b833d4b73280ccefdff2638e7a20a185b3cfcbcc68c05efe22d8ea6b +size 436627594 diff --git a/full_models/kin/config.json b/full_models/kin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kin/vocab.txt b/full_models/kin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d7e228036eeccf0f1db297e6dad2f19f1cf8ee18 --- /dev/null +++ b/full_models/kin/vocab.txt @@ -0,0 +1,44 @@ +| +a +i +u +e +n +b +r +m +o +y +k +w +g +t +s +h +z +d +' +f +c +j +v +p +l +7 +1 +- +2 +3 +4 +6 +9 +8 +5 +0 +ē +ō +ā +ī +` +ū + diff --git a/full_models/kir/D_100000.pth b/full_models/kir/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..751dbf017b1eb1e6df17061fac394296a05a5080 --- /dev/null +++ b/full_models/kir/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40e4888f87f4ca9bb7fea74807c012e26d41eb41091ff095bd751b3dff17a072 +size 561078847 diff --git a/full_models/kir/G_100000.pth b/full_models/kir/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..57792099f6966fb409b27b5ca5c12b7dc5876d27 --- /dev/null +++ b/full_models/kir/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5831fbc3ed071d045c8ef91533f51d466222948d12567f115d2c165193ecc036 +size 436380693 diff --git a/full_models/kir/config.json b/full_models/kir/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kir/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kir/vocab.txt b/full_models/kir/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..56983f3df53a4b2f48a674c34069b890a41e5c44 --- /dev/null +++ b/full_models/kir/vocab.txt @@ -0,0 +1,38 @@ +ж +ц +ө +– +и +ы +ю +я +е +о +й +л +у +- + +ү +_ +ң +э +а +д +т +с +н +р +ш +к +з +х +ё +б +в +п +ч +ь +г +м +ф diff --git a/full_models/kjb/D_100000.pth b/full_models/kjb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d43c0749d91ac681de7c0660ff4ddc51a83cc131 --- /dev/null +++ b/full_models/kjb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7743a0c3fced472174757a68cdc0863d826fba125759eb32cea0b4a6d5d3f29e +size 561109749 diff --git a/full_models/kjb/G_100000.pth b/full_models/kjb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39c753997d665b1ec9a73bafc1b469e8e6eeaae2 --- /dev/null +++ b/full_models/kjb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ceeb1e0eff8d19d56028ea09be06b4c69acb36886f3ca7837af7482165ab14 +size 436636808 diff --git a/full_models/kjb/config.json b/full_models/kjb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kjb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kjb/vocab.txt b/full_models/kjb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fa4fe11c22c718a6147b43af31209073defba863 --- /dev/null +++ b/full_models/kjb/vocab.txt @@ -0,0 +1,48 @@ +| +a +i +n +t +c +l +e +y +o +' +j +u +b +x +k +m +h +s +w +p +z +r +d +ẍ +q +ú +g +— +í +é +á +f +- +ó +v +0 +1 +2 +4 +5 +3 +9 +6 +7 +8 +ñ + diff --git a/full_models/kje/D_100000.pth b/full_models/kje/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4710433ba9b570d2250cdba2134d340a2b7150d4 --- /dev/null +++ b/full_models/kje/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b7a7fa919023804262c655d06934a02562c7cf5619e087f01885735e2e810da +size 561078996 diff --git a/full_models/kje/G_100000.pth b/full_models/kje/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d11abf2dbff45fff3f7b54c99c38b59867ae3f0d --- /dev/null +++ b/full_models/kje/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584b74312c6b526a97e5d638ca5ff5efb77a151861ad355641e049ad5ac7b3b4 +size 436354102 diff --git a/full_models/kje/config.json b/full_models/kje/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kje/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kje/vocab.txt b/full_models/kje/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1caa4fab92b1ea4917d94c5a14ba8056c5ca75e9 --- /dev/null +++ b/full_models/kje/vocab.txt @@ -0,0 +1,27 @@ + +f +k +h +s +z +o +_ +r +i +a +g +c +b +e +j +- +w +d +u +n +m +y +t +l +' +p diff --git a/full_models/kjg/D_100000.pth b/full_models/kjg/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..29edce0ef2e54980e13e64d4d27118c8429e59f7 --- /dev/null +++ b/full_models/kjg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d27f0e9d8fb3cb7a23d99023487ed371a96471d39e8e8a888c5e19c79cd7579 +size 561076053 diff --git a/full_models/kjg/G_100000.pth b/full_models/kjg/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..10957221ad817add6305c4e34abc701b7b388a2c --- /dev/null +++ b/full_models/kjg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:023fd5dbec287f79a54b9bf9007694acd47a46d77e66a29db5052112b28f0acd +size 436350241 diff --git a/full_models/kjg/config.json b/full_models/kjg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kjg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kjg/vocab.txt b/full_models/kjg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50dfccc2c1880af0b647de64be7ffbfe5bd31a31 --- /dev/null +++ b/full_models/kjg/vocab.txt @@ -0,0 +1,34 @@ +| +a +n +' +h +g +o +m +y +r +ô +t +i +l +k +w +u +s +e +é +p +c +è +d +b +v +ñ +j +- +ê +f +2 +0 + diff --git a/full_models/kjh/D_100000.pth b/full_models/kjh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f68cd91bd0ae59155cf9ae6fe362514bb3d17b03 --- /dev/null +++ b/full_models/kjh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea7a67b4ce68b022fc4dd7ba455f8e056b15dcdd607e35d337eb8c8945f19aa +size 561079249 diff --git a/full_models/kjh/G_100000.pth b/full_models/kjh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0fb1e5d59f7a14723a85af92f2752c3893aedc46 --- /dev/null +++ b/full_models/kjh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05393ed516d2e2accb675ebabba33ce3f8059feb445706b55f32d0e73112b40 +size 436400509 diff --git a/full_models/kjh/config.json b/full_models/kjh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kjh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kjh/vocab.txt b/full_models/kjh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..02a9059cb1f0d524f3ebda0d3c79017a755b9018 --- /dev/null +++ b/full_models/kjh/vocab.txt @@ -0,0 +1,46 @@ +ч +0 +р +і +ь +ы +ц +з +а +_ +х +и +с +м +е +л +ф +к +ң +4 + +́ +т +э +б +ӧ +г +н +1 +о +ш +– +ҷ +й +я +у +ю +ё +д +в +- +п +ӱ +2 +6 +ғ diff --git a/full_models/kki/D_100000.pth b/full_models/kki/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1c824595e3dc8894c9c12dac7286eddc11e2a0a --- /dev/null +++ b/full_models/kki/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb9a0e0db4ece1409651cca099dd0c0d2720aa1e725e2827766aaaf9c14f7789 +size 561110252 diff --git a/full_models/kki/G_100000.pth b/full_models/kki/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dc0d7ba2a11216731c783afb43979c15273d701c --- /dev/null +++ b/full_models/kki/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0813d6a4acf8898d9597f41976891cb7e21ba722c20b629511f8a9e3a149e5b2 +size 436595937 diff --git a/full_models/kki/config.json b/full_models/kki/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kki/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kki/vocab.txt b/full_models/kki/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..296295e817e4fbf720aecc7c30863386ed340226 --- /dev/null +++ b/full_models/kki/vocab.txt @@ -0,0 +1,29 @@ +| +a +i +u +n +e +o +w +k +m +l +h +g +y +s +d +f +t +c +b +j +p +' +v +2 +q +- +1 + diff --git a/full_models/kkj/D_100000.pth b/full_models/kkj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c5175298758e33b66264ff20d3d22a6c1b0ea6b1 --- /dev/null +++ b/full_models/kkj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b22535520dc5130d2bcd50774c23d2c4ec763092ffa5dfa49ae0d3ab38a6269 +size 561109878 diff --git a/full_models/kkj/G_100000.pth b/full_models/kkj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..42db07a17c175404cbe5a6c92b3255b0145d1ad9 --- /dev/null +++ b/full_models/kkj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b858cd25a1c331c4a5d6e896eb2ae3a3f1e55114566cc5f9f7fbd2299fa13cbb +size 436620690 diff --git a/full_models/kkj/config.json b/full_models/kkj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kkj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kkj/vocab.txt b/full_models/kkj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2a758f3f809c5080fe6f10e7a6980d6f8afd6d16 --- /dev/null +++ b/full_models/kkj/vocab.txt @@ -0,0 +1,41 @@ +| +á +a +n +e +m +k +y +i +t +ó +ä +u +s +o +w +ñ +d +b +l +j +ë +g +p +à +ã +r +h +ï +ê +è +' +ù +î +ì +f +v +õ +1 +- + diff --git a/full_models/kle/D_100000.pth b/full_models/kle/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3c13299776e02432087afc396df709531e99db50 --- /dev/null +++ b/full_models/kle/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014b422f1daaac74d9273b1469d1e154e8349f87dd73d232ec55674f9a44b008 +size 561079248 diff --git a/full_models/kle/G_100000.pth b/full_models/kle/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..860eae93c5fef968a249995c643cdcf756e0c80b --- /dev/null +++ b/full_models/kle/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2dee6ca5d118ed4f0726c2a044ee429922ca42e710397ee53f35f12632e404 +size 436440088 diff --git a/full_models/kle/config.json b/full_models/kle/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kle/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kle/vocab.txt b/full_models/kle/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..15a9187f4034c6d15f031cf99a0de5254bb31cd6 --- /dev/null +++ b/full_models/kle/vocab.txt @@ -0,0 +1,63 @@ +ू +ध +अ +् +उ +ऋ +े +स +च +ई +ष +ल +भ +ण +घ +ु +ए +ँ +ो +ह +व + +ङ +ज +- +ै +इ +य +ी +ञ +ड +' +ठ +ऊ +ट +ढ +ग +त +ः +न +फ +ा +छ +प +श +ौ +ख +क +‍ +आ +झ +ब +द +ृ +र +थ +ि +ं +_ +ऐ +म +ओ +– diff --git a/full_models/klu/D_100000.pth b/full_models/klu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5662e3ceaf0eaf33c993f6fe795b28b58ff30b4e --- /dev/null +++ b/full_models/klu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0edc5b3a0d4e76f1d9aa011d2a498136663a08b17b2009bd4e6e85186bd1f2b8 +size 561109884 diff --git a/full_models/klu/G_100000.pth b/full_models/klu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d282e63e2c8ed4b2e002bfafc84f8cdcc6b4983a --- /dev/null +++ b/full_models/klu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4fc280f33f77df7770394d1f0a9c37275f4222be8b4074f88945e9e8670058e +size 436641298 diff --git a/full_models/klu/config.json b/full_models/klu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/klu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/klu/vocab.txt b/full_models/klu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..243fa1a2c5e32239275b4ffd42df4d8298328cee --- /dev/null +++ b/full_models/klu/vocab.txt @@ -0,0 +1,50 @@ +| +̍ +n +a +e +ɛ +l +ɔ +o +i +k +‐ +t +y +b +s +u +m +h +j +w +p +̀ +d +â +è +ê +˖ +ô +ò +̂ +à +ì +î +f +ù +g +û +c +ˆ +ˈ +ǔ +- +ě +ǐ +ǎ +' +̌ +ǒ + diff --git a/full_models/klv/D_100000.pth b/full_models/klv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff5a85681124a68efeb85d72cadd20e7ce7d7fe9 --- /dev/null +++ b/full_models/klv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:271d0e6a35b435b8cc0f9db8398fe0105046ecb1f7858e7ffc6a0c1850454f09 +size 561079115 diff --git a/full_models/klv/G_100000.pth b/full_models/klv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66d2f9ff1e6c17504e867a68eb394b3ff590b083 --- /dev/null +++ b/full_models/klv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f81efb39e2139a16f484fe86ad72d5fa490b9ddc4e146040cf761992d876d43 +size 436388060 diff --git a/full_models/klv/config.json b/full_models/klv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/klv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/klv/vocab.txt b/full_models/klv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..31e63b7a817a7d29fe76b13ee3f0d55aa53e39b5 --- /dev/null +++ b/full_models/klv/vocab.txt @@ -0,0 +1,41 @@ +w +s +v +_ +d +j +y +k +0 +b +o +p +̃ +' +— +1 +m +- +u +3 +a +g +ǝ +6 +2 +l +7 +e +4 +f +ŋ +ṽ +8 +n + +h +i +t +5 +r +9 diff --git a/full_models/klw/D_100000.pth b/full_models/klw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b33d9d3a36fa4b0e1c153af3fd7eaf01d1c4198 --- /dev/null +++ b/full_models/klw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9cb2c1151a8c06919f593cf69d466478a8f25d5981099fe4c2c11b88015a19e +size 561076026 diff --git a/full_models/klw/G_100000.pth b/full_models/klw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..affd14d86568a2393944492e93ae402274c783ac --- /dev/null +++ b/full_models/klw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b774108bd2ff677db8ff531d2a71512bef8296911ebd058e3090b13f566ac1 +size 436333659 diff --git a/full_models/klw/config.json b/full_models/klw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/klw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/klw/vocab.txt b/full_models/klw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9e8b94f44d8d183552f9e23577a6c205c6b5fdef --- /dev/null +++ b/full_models/klw/vocab.txt @@ -0,0 +1,27 @@ +w +h +o +b +g +y +d + +' +a +s +j +f +i +- +n +e +c +m +t +r +l +u +_ +k +p +z diff --git a/full_models/kma/D_100000.pth b/full_models/kma/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4182ef07de259ad5518e9156eaea5d566842f5ce --- /dev/null +++ b/full_models/kma/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5274e96b3852f26c09005756079da63a84ba32539b97bdc2c822b0fd4b7fae +size 561109883 diff --git a/full_models/kma/G_100000.pth b/full_models/kma/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e463487f7fe421a44e8f8887eeccf01fd8ccf352 --- /dev/null +++ b/full_models/kma/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ec025c4bffbb31088985f943390c9360a921e23b0aa08da3ecaeef50ab3d81 +size 436600600 diff --git a/full_models/kma/config.json b/full_models/kma/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kma/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kma/vocab.txt b/full_models/kma/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5e9b091a0c873a4a0afa9e0ad16c2c6638fb198e --- /dev/null +++ b/full_models/kma/vocab.txt @@ -0,0 +1,32 @@ +| +a +ɩ +i +ŋ +n +e +d +m +b +ʊ +t +k +y +s +g +w +l +u +o +r +v +h +ɔ +p +j +c +f +z +- +' + diff --git a/full_models/kmd/D_100000.pth b/full_models/kmd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cc2a4f951126c63e6025f939ba28036664a9aa00 --- /dev/null +++ b/full_models/kmd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21efb20c23f7f0d68f08961a7f1715315a7221c5e72f0cbee96861763b0eaa36 +size 561079116 diff --git a/full_models/kmd/G_100000.pth b/full_models/kmd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67bee738597c5e88a13910971107c41ebb03c329 --- /dev/null +++ b/full_models/kmd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9882a9380cb33eaa907072592d1922bd1bfa806c7af7cf9278f145095868089 +size 436377392 diff --git a/full_models/kmd/config.json b/full_models/kmd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kmd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kmd/vocab.txt b/full_models/kmd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..93fb4e078c69d82dd3d73f2e84872c710135c0fb --- /dev/null +++ b/full_models/kmd/vocab.txt @@ -0,0 +1,37 @@ +p +ꞌ +- +h +n +x +q +t + +_ +e +d +é +y +l +k +g +4 +c +s +o +z +w +0 +ʼ +m +f +1 +u +i +v +a +j +' +r +b +6 diff --git a/full_models/kml/D_100000.pth b/full_models/kml/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ac8c008c9863ff5df7b1d62a2c18c41062139749 --- /dev/null +++ b/full_models/kml/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631313ac82e6476edd42e01cc5b724510f87e2272eac6c8656f1207ddd8e7f53 +size 561078891 diff --git a/full_models/kml/G_100000.pth b/full_models/kml/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1cb5e6d9015f614fa4c9fc4958f7647946bc96d9 --- /dev/null +++ b/full_models/kml/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120a32f6e4d4ed98c3a119677ced639e8c7e3b86444a40eeadc8066cc667351e +size 436367146 diff --git a/full_models/kml/config.json b/full_models/kml/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kml/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kml/vocab.txt b/full_models/kml/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8a89065a380c909304ea20b30b3713d7b4a1f826 --- /dev/null +++ b/full_models/kml/vocab.txt @@ -0,0 +1,32 @@ +e +_ +d +f +t +' +n +j +y +ḵ +h +r +q +o +b +w +u +- +s +g +m +p +k +z +l +ḻ +c +v +x + +a +i diff --git a/full_models/kmr-script_arabic/D_100000.pth b/full_models/kmr-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1ed00f11c61ffba8aa70d1653b283f67e5785bb --- /dev/null +++ b/full_models/kmr-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e2a714ab275a2e620c6841fdfdb419285964c3a0d30900b09042d2984f0320 +size 561078995 diff --git a/full_models/kmr-script_arabic/G_100000.pth b/full_models/kmr-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..571c90a375e197fca5ccf6fb3cf45f6aa588bfb2 --- /dev/null +++ b/full_models/kmr-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4e2e3a2ba56dd02353abaa1f76081bdc14558a952438de9ed4fb552f516e2d +size 436382625 diff --git a/full_models/kmr-script_arabic/config.json b/full_models/kmr-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kmr-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kmr-script_arabic/vocab.txt b/full_models/kmr-script_arabic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..59ccee3770f1380b7687de3708ab2951678de4e2 --- /dev/null +++ b/full_models/kmr-script_arabic/vocab.txt @@ -0,0 +1,38 @@ +| +ە +ا +ی +ن +و +ێ +ر +د +ب +ك +ت +م +ه +ل +س +ئ +ۆ +ڤ +خ +گ +ژ +ز +ش +پ +چ +ج +ڕ +ف +ح +ق +ع +ڵ +غ +m +b +c + diff --git a/full_models/kmr-script_cyrillic/D_100000.pth b/full_models/kmr-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..feac5b496f5a9c64e9b63bc72a1572b991d1cf03 --- /dev/null +++ b/full_models/kmr-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce876d331763413d9181edbd89c20bf23b8cf6d08bd7ec9acab828519b04d8f +size 561078471 diff --git a/full_models/kmr-script_cyrillic/G_100000.pth b/full_models/kmr-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bff7403fe1e57b5abbee37bbf81bf872f224f5b4 --- /dev/null +++ b/full_models/kmr-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b26c472f770cad34b19811506884fc079c8e7273f92e64ee1251befbfeef6222 +size 436370939 diff --git a/full_models/kmr-script_cyrillic/config.json b/full_models/kmr-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kmr-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kmr-script_cyrillic/vocab.txt b/full_models/kmr-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cfb936f5d8fecbc2489bbef00cc460aabedf8de0 --- /dev/null +++ b/full_models/kmr-script_cyrillic/vocab.txt @@ -0,0 +1,35 @@ +| +ә +а +ь +н +е +р +и +д +к +б +w +' +т +м +й +у +һ +с +х +л +ӧ +в +г +ж +о +з +ш +п +ч +q +щ +ф +- + diff --git a/full_models/kmr-script_latin/D_100000.pth b/full_models/kmr-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fb9a91e80b30860fb7cd49d5f74339d7d56171a2 --- /dev/null +++ b/full_models/kmr-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae03f6c025ac37b6a8f87dbbc57239a42cf5f74f72e52078974e652ce422298 +size 561079341 diff --git a/full_models/kmr-script_latin/G_100000.pth b/full_models/kmr-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53487a172dfb21ec95dbbe0e191bdd37fd76bd4b --- /dev/null +++ b/full_models/kmr-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9b2a4963f955ec496c7cca059d02b4586795ad086e964d73f0c1746326ad91 +size 436375528 diff --git a/full_models/kmr-script_latin/config.json b/full_models/kmr-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kmr-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kmr-script_latin/vocab.txt b/full_models/kmr-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..80e9e2006bc9e95e6d191e917c4987110d571f55 --- /dev/null +++ b/full_models/kmr-script_latin/vocab.txt @@ -0,0 +1,35 @@ +n +h +ş +ê +e +p +c +x +w +j +d +s +ç +- +o +î +m +û +k +l +a +b +_ +z +' +u +f +v +q + +y +t +i +g +r diff --git a/full_models/kmu/D_100000.pth b/full_models/kmu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ddfb947cc70e4262a35565f101130ad6c4d299f8 --- /dev/null +++ b/full_models/kmu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f11d2eb172f33b62a33a9d84b60da59a4c0efb06bca99d9dd598cdab48609a7 +size 561078585 diff --git a/full_models/kmu/G_100000.pth b/full_models/kmu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6ffef69d8098b0dfa0e31aae46fd66071eb37e53 --- /dev/null +++ b/full_models/kmu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781bd3a9217949cb8861d0e246b20fd16b92c14a3e3f95a3c3b223ac20e20346 +size 436338867 diff --git a/full_models/kmu/config.json b/full_models/kmu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kmu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kmu/vocab.txt b/full_models/kmu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..60c6e2a6f513efd54cd7615624ce0bdea98bd228 --- /dev/null +++ b/full_models/kmu/vocab.txt @@ -0,0 +1,21 @@ + +t +u +ꞌ +_ +e +l +n +h +g +a +v +i +s +o +y +p +m +k +- +f diff --git a/full_models/knb/D_100000.pth b/full_models/knb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dae5dbbf1091542f8ee405adcaa6f94458880054 --- /dev/null +++ b/full_models/knb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e3b85df42f53f48e44e38a45a97304721a8b3adceee7eb6c5733bf7b2af9d51 +size 561078870 diff --git a/full_models/knb/G_100000.pth b/full_models/knb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d15ebd87ba1de09b9d702b3781c50a789be5d61 --- /dev/null +++ b/full_models/knb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07238f0f877f2316d58796760a90447b28d74a7dcebdd981f3c01080d3ba6fe2 +size 436389807 diff --git a/full_models/knb/config.json b/full_models/knb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/knb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/knb/vocab.txt b/full_models/knb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..df9b21d0ad98ca333f78ecec21aacf732c08821a --- /dev/null +++ b/full_models/knb/vocab.txt @@ -0,0 +1,42 @@ +g +q +ù +l +ì +o +c +t +v +b +- +_ +x +r +w +ɏ +j +e +a +6 +s +d +' +i +ʼ +f +m +k +à +2 +1 +z +p +4 +h +0 +è +n +ò +y +u + diff --git a/full_models/kne/D_100000.pth b/full_models/kne/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e28a76489817d0d15216a183fdc3c18ae93ae343 --- /dev/null +++ b/full_models/kne/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a232c5eba646187778638ee4b62898830f1952bcf81d974b6d54cf79862f4f19 +size 561078972 diff --git a/full_models/kne/G_100000.pth b/full_models/kne/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..40bd3629a08646cd80d81194e999b1b472d43a93 --- /dev/null +++ b/full_models/kne/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e7674844ad48839cb543160d705c1fde7184ba2e95ade513d6b21bb9417bad6 +size 436371882 diff --git a/full_models/kne/config.json b/full_models/kne/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kne/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kne/vocab.txt b/full_models/kne/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..61112fba3055abd8fda051e2bbac9bca2d7a8af5 --- /dev/null +++ b/full_models/kne/vocab.txt @@ -0,0 +1,34 @@ +u +4 +o +_ +w +b +0 +f +m +i +c +g +z +e +l +x +k +n +t +a +s +q +r +j +3 +p +y +1 +v +d + +- +' +h diff --git a/full_models/knf/D_100000.pth b/full_models/knf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d0d2f1fbe369eddd22275358d1819015a6456542 --- /dev/null +++ b/full_models/knf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c7075b1b6d9f65b0e7ac25ea5da717aa737242e217e94bff7de08a2099ce68 +size 561078891 diff --git a/full_models/knf/G_100000.pth b/full_models/knf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9eaa6ae01d242f231c03bc61a4c0be2c17f5d458 --- /dev/null +++ b/full_models/knf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b334d3aa18e238be33067c33a749cf5ced0337da680d9f3a5d267e08f123a716 +size 436367304 diff --git a/full_models/knf/config.json b/full_models/knf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/knf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/knf/vocab.txt b/full_models/knf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3593ffd9d023f21498e3fa96132a23d1c30b2c45 --- /dev/null +++ b/full_models/knf/vocab.txt @@ -0,0 +1,32 @@ +k +ë +– +e +ş +u +b +' +i +j +y +o +ŋ +ñ +t +_ +l +d +ŧ +m +a +g +ţ +p +- +n + +w +h +c +r +f diff --git a/full_models/knj/D_100000.pth b/full_models/knj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..86b2db95edfd8c92bf026551afb79d7df27d5e97 --- /dev/null +++ b/full_models/knj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3887e777965fa43cdd1a217d5042ae506fe781068ed2cdf70f07767ed0fdfaab +size 561109858 diff --git a/full_models/knj/G_100000.pth b/full_models/knj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fefb6b8b672c14e1156251991edb41049573fd88 --- /dev/null +++ b/full_models/knj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a75fb7f6d3a7898d7edcf8892c3bb64ce1201e5d4bb891c950b499c5f44d9b +size 436611348 diff --git a/full_models/knj/config.json b/full_models/knj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/knj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/knj/vocab.txt b/full_models/knj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ec9e75704941afa82e1af0cb72ce4d7181907b1 --- /dev/null +++ b/full_models/knj/vocab.txt @@ -0,0 +1,37 @@ +| +a +e +i +n +j +t +c +' +l +o +y +u +x +s +b +m +h +w +k +p +r +d +z +ẍ +q +ú +á +g +— +í +é +v +- +f +ó + diff --git a/full_models/knk/D_100000.pth b/full_models/knk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4af9fcc762f6677d8de80f66845d980726da51a1 --- /dev/null +++ b/full_models/knk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51bad66fa1e65ff2f8d755db85458b2263c462fb210c599a8736658bf133e00 +size 561110004 diff --git a/full_models/knk/G_100000.pth b/full_models/knk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53d508f0075e6820eb4ea34ff72168c7a8a69cb0 --- /dev/null +++ b/full_models/knk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be97f684f3f9496f56c17c0219bd5ff66578cec2f3474542f5c6b4571474b3bd +size 436589204 diff --git a/full_models/knk/config.json b/full_models/knk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/knk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/knk/vocab.txt b/full_models/knk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a60ca49d88db8e0bdbe537b0e9b0a8fcd56d2dc5 --- /dev/null +++ b/full_models/knk/vocab.txt @@ -0,0 +1,27 @@ +| +a +n +i +ɛ +l +k +o +m +ɔ +y +u +e +b +r +w +t +s +d +g +- +f +h +p +c +' + diff --git a/full_models/kno/D_100000.pth b/full_models/kno/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e10f229886ce5a9af757a55be084af3f223ca1b3 --- /dev/null +++ b/full_models/kno/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd97e4e252fb5198357e1dcfb16d7009e39c01a176a5914daa378a344160864 +size 561109759 diff --git a/full_models/kno/G_100000.pth b/full_models/kno/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20ceade3953c05c63e89eb48a9211c75bfebf82b --- /dev/null +++ b/full_models/kno/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d386310c745d084dda38cd03d0ce1feb1ae01d9c334d85307d75a76ec93b7c0c +size 436583734 diff --git a/full_models/kno/config.json b/full_models/kno/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kno/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kno/vocab.txt b/full_models/kno/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cfab03b77506e170ec7f96733e62ce640a85c48c --- /dev/null +++ b/full_models/kno/vocab.txt @@ -0,0 +1,25 @@ +| +a +n +m +ɛ +i +ɔ +e +b +o +c +h +k +s +d +t +u +y +w +‐ +f +g +' +p + diff --git a/full_models/kog/D_100000.pth b/full_models/kog/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e2cf37c70000d32f7e55e0f0bf36dd49e7b0058 --- /dev/null +++ b/full_models/kog/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45332fd643e9d8d9d631be113be91c482c6942ac4e2188b0cb5418ab855dafd5 +size 561078482 diff --git a/full_models/kog/G_100000.pth b/full_models/kog/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3398445ec285dcc6f3df2d9cc010acf03dfe814d --- /dev/null +++ b/full_models/kog/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e4de76a11d439b931add005c61fe7e17808d34b7876f90aaaf4a72f9f26848 +size 436394273 diff --git a/full_models/kog/config.json b/full_models/kog/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kog/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kog/vocab.txt b/full_models/kog/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..347cd9a6a6cf6d1d25296606f6af3a9ed03b44df --- /dev/null +++ b/full_models/kog/vocab.txt @@ -0,0 +1,45 @@ +x +' +c +_ +ʉ +l +d +í +g +a +i +ñ +p +ó +o +́ +3 +ã +y +2 +z +— +4 +0 +s +ú +n +1 +u +h +e + +6 +t +8 +j +5 +m +w +b +7 +á +é +k +9 diff --git a/full_models/kor/D_100000.pth b/full_models/kor/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe1f29545d68d3fb1483fd949b613a32b6e6d5f5 --- /dev/null +++ b/full_models/kor/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f596874046b9212b084813629815a656a4f147b7e03486155489819d543f376 +size 561110126 diff --git a/full_models/kor/G_100000.pth b/full_models/kor/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d84393fb3257afbe56c61ddf797d82432b606ebd --- /dev/null +++ b/full_models/kor/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5834075b1f9190b0c76129b3de502110461e37288d83f79c442271d44b1485 +size 436588317 diff --git a/full_models/kor/config.json b/full_models/kor/config.json new file mode 100644 index 0000000000000000000000000000000000000000..993d1dedb1d0c8e820b98f9e2f019ff166327038 --- /dev/null +++ b/full_models/kor/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.uroman", + "validation_files": "dev.uroman", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kor/vocab.txt b/full_models/kor/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..c7a54775f378fb2fd26d2a43d1bd850639ea221e --- /dev/null +++ b/full_models/kor/vocab.txt @@ -0,0 +1,25 @@ +u +_ +t +w +s +o +y +a +h +i +j +- +k +b +c +' +n +l +d +g +r + +e +m +p diff --git a/full_models/kpq/D_100000.pth b/full_models/kpq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9af092974e9827a29f5b01fd99db064dbfab01d1 --- /dev/null +++ b/full_models/kpq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b47d97c95195ecb74c683ba71a967aee19f4060df702b403ccb5b93b0ee160 +size 561078981 diff --git a/full_models/kpq/G_100000.pth b/full_models/kpq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ed847ef69c2ee4476692a330c0e798ae9e8de90 --- /dev/null +++ b/full_models/kpq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca7183dbe6f25a982f8bdab4209399b455f9bb85944002478f3676e8722fd3c +size 436379972 diff --git a/full_models/kpq/config.json b/full_models/kpq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kpq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kpq/vocab.txt b/full_models/kpq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fb5c16ea47107f435aaeb056ac29cb2485c3cd58 --- /dev/null +++ b/full_models/kpq/vocab.txt @@ -0,0 +1,37 @@ +- +g +o +t +f +1 +_ +z +l +– +' +s +u +m +b +i +j +3 +p +0 +7 +k +r +e +2 +w +y +d +́ +4 + +a +5 +n +h +c +9 diff --git a/full_models/kps/D_100000.pth b/full_models/kps/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4871870a23283a229a115a9196b5251f07645674 --- /dev/null +++ b/full_models/kps/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6455663bf6e84d825131cdf5be912ef58ca9207259060f685f7da89216002cf8 +size 561075775 diff --git a/full_models/kps/G_100000.pth b/full_models/kps/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a40ba908b662671d185087d27cee21a6db9fbed --- /dev/null +++ b/full_models/kps/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc2ff659e3017f3bc0970491d6665741c0e9a79e6942ef3aaa092221e18ce4c +size 436333749 diff --git a/full_models/kps/config.json b/full_models/kps/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kps/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kps/vocab.txt b/full_models/kps/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..301a1c4aa65af6ccbb4333ac3b8489674827506d --- /dev/null +++ b/full_models/kps/vocab.txt @@ -0,0 +1,28 @@ +| +a +i +o +e +n +t +k +m +w +s +y +r +l +f +h +d +u +b +g +p +- +j +– +z +c +' + diff --git a/full_models/kpv/D_100000.pth b/full_models/kpv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87d404807bb3865a4903aacb8819db4d2c56a7e5 --- /dev/null +++ b/full_models/kpv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728f6d31d58ecd27b49088afc31949a7589fdd3525ee583d62431472658f567d +size 561079019 diff --git a/full_models/kpv/G_100000.pth b/full_models/kpv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5d58f04f26a5f55ab1287c3d74f9a0655e1f094a --- /dev/null +++ b/full_models/kpv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d61cfcd350f02270b0d5cfa680185541aebac5979422c476cc4beac50d472a23 +size 436387467 diff --git a/full_models/kpv/config.json b/full_models/kpv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kpv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kpv/vocab.txt b/full_models/kpv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1b5104e27669268faac9df899632a01fc48b456d --- /dev/null +++ b/full_models/kpv/vocab.txt @@ -0,0 +1,40 @@ +м +н +ö +б +в +ъ + +ы +я +р +_ +л +к +т +ш +– +i +с +ц +г +ё +п +ю +а +ь +о +е +д +и +і +з +ж +ф +й +- +х +у +щ +э +ч diff --git a/full_models/kpy/D_100000.pth b/full_models/kpy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5dd0e04d45e3807ffa5ec44cb58ad313ac9ec978 --- /dev/null +++ b/full_models/kpy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d96e5e6bc328870dd102ffce4a115892d3b71c4e4518f244b57276f615acf0cf +size 561076156 diff --git a/full_models/kpy/G_100000.pth b/full_models/kpy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..711770cccf24f5ebee271fd604428d9831ac93c6 --- /dev/null +++ b/full_models/kpy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5822102333aa6f0f6517f257f88c70f958bb3cc2c565164c385b22373515f8b3 +size 436362033 diff --git a/full_models/kpy/config.json b/full_models/kpy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kpy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kpy/vocab.txt b/full_models/kpy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e3a9354c3150ab27176a74305072a0fb30ab9b9f --- /dev/null +++ b/full_models/kpy/vocab.txt @@ -0,0 +1,39 @@ +у +ц +о +х +' +ӈ +ч +в +ж +ӄ + +ю +т +– +й +а +ф +э +ш +я +д +р +е +г +и +_ +н +м +ь +л +ё +с +- +ы +з +к +ъ +б +п diff --git a/full_models/kpz/D_100000.pth b/full_models/kpz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c843c0ee2d05a44e1df08fa1de00cca5dd3da9be --- /dev/null +++ b/full_models/kpz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbe18378171ac174f423275847b199d3ed061c8e639dec5d77f865dfa207384f +size 561109872 diff --git a/full_models/kpz/G_100000.pth b/full_models/kpz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..64c26d51ab552d3f9b741218ab728253b82ed98a --- /dev/null +++ b/full_models/kpz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:399584dffd19bbad02acd46f6a752fd4a0f779113dc752a4fd79a5947b42b99a +size 436586043 diff --git a/full_models/kpz/config.json b/full_models/kpz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kpz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kpz/vocab.txt b/full_models/kpz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..07dd08470081dac8cccdcd0ff5a2c9d89f56b9b6 --- /dev/null +++ b/full_models/kpz/vocab.txt @@ -0,0 +1,26 @@ +| +o +k +e +t +y +n +i +u +a +m +p +c +w +l +r +s +ŋ +ö +' +ä +f +ë +ü +- + diff --git a/full_models/kqe/D_100000.pth b/full_models/kqe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1c89d332ab7bfff256ccbc21727a6fc95dc8a59 --- /dev/null +++ b/full_models/kqe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f0a5afd87de778d431cbb44f170b32b5f2a8da931e4f0f62b03dc7ff1ab005 +size 561078726 diff --git a/full_models/kqe/G_100000.pth b/full_models/kqe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..297d166d32081621b60a867d8d8dde491d18d284 --- /dev/null +++ b/full_models/kqe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:407d00e20b91655a4cd08d95ca4aa48510cb9ea145959caeb476576c54ce9b7a +size 436371772 diff --git a/full_models/kqe/config.json b/full_models/kqe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kqe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kqe/vocab.txt b/full_models/kqe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4e742b25c2103bde42b6a242afd7c092572c4d7 --- /dev/null +++ b/full_models/kqe/vocab.txt @@ -0,0 +1,35 @@ +0 +t +i +b +3 +r +1 +w +o +n +p +h +z +u +6 +- +5 +4 +y +s +a +g +_ +7 +e +l +k + +m +9 +8 +j +2 +' +d diff --git a/full_models/kqp/D_100000.pth b/full_models/kqp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4705b8a1364fa2ae0d30247974503c0fce38aad --- /dev/null +++ b/full_models/kqp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c58bb2ab3e920842b614647ddd8763c18aede54f86a471dfe98f599dab51464 +size 561109981 diff --git a/full_models/kqp/G_100000.pth b/full_models/kqp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..615a177b745bd26b47fb78855b6268ec51fc64d7 --- /dev/null +++ b/full_models/kqp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1e8cfb4dac15325089b445c6601c4be43cee08f8a31d90962d490ddb79c057 +size 436605959 diff --git a/full_models/kqp/config.json b/full_models/kqp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kqp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kqp/vocab.txt b/full_models/kqp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..391f1cac1a86dcf8c504abe7b44620001c2f84cd --- /dev/null +++ b/full_models/kqp/vocab.txt @@ -0,0 +1,33 @@ +| +a +e +n +i +ô +r +b +m +k +ɲ +y +é +w +ê +l +g +o +h +t +s +u +ŋ +j +d +p +ɗ +ɓ +c +à +á +- + diff --git a/full_models/kqr/D_100000.pth b/full_models/kqr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fed2ae7ab3ce465422e36d05aaf4f18ff6319e08 --- /dev/null +++ b/full_models/kqr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:681261dd92b70fbeedcf98b4e62d1d5b9cb96164a15d175d2c2202c6f77d2633 +size 561078735 diff --git a/full_models/kqr/G_100000.pth b/full_models/kqr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c8e3a2ce6efd31e77ba0a6e2be97680d674a2443 --- /dev/null +++ b/full_models/kqr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9efc2f7c8baa8d53663509b5c3e302fd56a301d20ab4bbee8c7e45383731fa5 +size 436390444 diff --git a/full_models/kqr/config.json b/full_models/kqr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kqr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kqr/vocab.txt b/full_models/kqr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2f6957e9fa173fcb9bcbd8286964b640cb890608 --- /dev/null +++ b/full_models/kqr/vocab.txt @@ -0,0 +1,43 @@ +_ + +' +i +s +û +w +l +a +5 +- +d +4 +m +n +h +b +ô +r +î +y +e +1 +v +g +õ +k +2 +t +c +â +j +z +– +o +f +6 +8 +3 +0 +u +p +ê diff --git a/full_models/kqy/D_100000.pth b/full_models/kqy/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..829228e8cdd2e12a4d1a03743bbe119cfb8bda8f --- /dev/null +++ b/full_models/kqy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e02310d60dd276842331899aefa27f7245d5d75fcfe8fda704fe586924d5426 +size 561078723 diff --git a/full_models/kqy/G_100000.pth b/full_models/kqy/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..31368fdc16b13b72c641b89282da29a88b61f494 --- /dev/null +++ b/full_models/kqy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610c4219d9f67ddde1cf390299f2e62b06215face8080fa72bd44dc9888f31ba +size 436697453 diff --git a/full_models/kqy/config.json b/full_models/kqy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kqy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kqy/vocab.txt b/full_models/kqy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4eced93fb91d077c1d1e3f62dc89d5b3bdcfac0 --- /dev/null +++ b/full_models/kqy/vocab.txt @@ -0,0 +1,175 @@ +| +ን +ኤ +ይ +ሴ +ዬ +ኮ +ስ +አ +ህ +ድ +ዎ +ኡ +ሀ +ረ +ተ +ቶ +ሰ +ነ +ወ +ኔ +ዴ +ኬ +ማ +ሱ +ቤ +ቴ +ገ +ዶ +ት +መ +ኦ +የ +ር +ኑ +ጌ +ሥ +በ +ሶ +ከ +ደ +ሮ +ፈ +ግ +እ +ብ +ም +ለ +ሸ +ኣ +ቱ +ቄ +ቸ +ሎ +ሜ +ል +ዮ +ታ +ክ +ሽ +ሤ +ዼ +ጉ +ዝ +ባ +ሞ +ፌ +ሳ +ሩ +ሌ +ጎ +ኩ +ሬ +ዜ +ቦ +ካ +ሡ +ቾ +ሄ +ቡ +ቁ +ላ +ሁ +ሦ +ዽ +ሼ +ሙ +ዘ +ዸ +ዾ +ጽ +ፍ +ያ +ዱ +ሉ +ኢ +ቅ +ፉ +ጩ +ና +ሹ +ዉ +ዋ +ዞ +ጼ +ቆ +ጹ +ች +ሃ +ዹ +ጸ +ው +ሚ +ሾ +ፋ +ዙ +ሲ +ጭ +ጬ +ጾ +ሠ +ሆ +ጮ +ኖ +ጰ +ዳ +ጵ +ዲ +ዤ +ቼ +ቀ +ጋ +ሻ +ራ +ጄ +ዩ +ፎ +ጴ +ዠ +ዌ +ጫ +ሣ +ጨ +ቹ +ዛ +ዻ +ቃ +ዥ +ጺ +ጻ +ኒ +ጶ +ቻ +ሂ +ጳ +ዺ +ፊ +ኪ +ቢ +ዡ +ዦ +ዣ +ቂ +ሊ +ጱ +ዪ +ጅ +- +ሺ +ዢ +– +ጁ +ዚ +ጊ + diff --git a/full_models/krc/D_100000.pth b/full_models/krc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0fef6d04a4fa2b4d170ebed558b359a9ad26174b --- /dev/null +++ b/full_models/krc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e5133d7205d5da0d1cb34d746310776e60745bf090812bdcba3ad888b20432 +size 561079104 diff --git a/full_models/krc/G_100000.pth b/full_models/krc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5b5b1f89c644c197e48adff6b8da81b0c909d737 --- /dev/null +++ b/full_models/krc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b5ff1d9aa2413e60134d7ddfa699fe963d5e85f595a04b6f77712c97fe4285 +size 436380560 diff --git a/full_models/krc/config.json b/full_models/krc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/krc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/krc/vocab.txt b/full_models/krc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e69ea0663ca24dfb35a30dbf030ca7ca02409522 --- /dev/null +++ b/full_models/krc/vocab.txt @@ -0,0 +1,37 @@ +| +а +н +л +и +е +ы +д +р +г +к +у +ъ +т +б +с +м +ю +з +й +о +х +э +п +ш +ч +ж +ё +я +– +ф +- +ь +в +' +ц + diff --git a/full_models/kri/D_100000.pth b/full_models/kri/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5777af0afe2ef18bdb2d19a646d81877d4128598 --- /dev/null +++ b/full_models/kri/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0affae12a3d8d19f3b4edfe14a5aa6dfe8456ca3fcd12fba1c9db7ef58fd88f1 +size 561110020 diff --git a/full_models/kri/G_100000.pth b/full_models/kri/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..48758a7cba81b051f8e00b41665dc83b37c22836 --- /dev/null +++ b/full_models/kri/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d54e43fa141aac982e4b819f13ce2d4124ea32a385a2611b86b0ca0e21421a6 +size 436597910 diff --git a/full_models/kri/config.json b/full_models/kri/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kri/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kri/vocab.txt b/full_models/kri/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ab5fd19f4d4c86e0e68d21d8f47dc0520b056fb8 --- /dev/null +++ b/full_models/kri/vocab.txt @@ -0,0 +1,30 @@ +| +n +i +a +d +ɔ +ɛ +e +t +s +w +l +m +k +u +p +g +b +f +o +r +y +j +z +v +h +c +- +' + diff --git a/full_models/krj/D_100000.pth b/full_models/krj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8eb8f67c1408ab8d81ac346de990443c0f92eb27 --- /dev/null +++ b/full_models/krj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149b2a93c81ab76dc7d012c516118f5c1bfffa30f6bbbacfeeaf3193432dbb66 +size 561109856 diff --git a/full_models/krj/G_100000.pth b/full_models/krj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..85d7fd9e957d1ac3cb644eb83f6ba7332aacd524 --- /dev/null +++ b/full_models/krj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d96549b7f67ce6a4835c4a85a2123790efe795ae439f9657224276fee62ef4e +size 436615972 diff --git a/full_models/krj/config.json b/full_models/krj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/krj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/krj/vocab.txt b/full_models/krj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e9b12bb29941fb47b790089eec450118c33696a6 --- /dev/null +++ b/full_models/krj/vocab.txt @@ -0,0 +1,39 @@ +a +| +n +g +i +k +o +u +m +s +t +d +p +r +l +y +b +h +w +e +- +j +c +' +f +z +0 +v +q +— +1 +2 +x +4 +3 +5 +7 +6 + diff --git a/full_models/krl/D_100000.pth b/full_models/krl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1435d4ca41c3e7e88891548f87ee9037a1f96f72 --- /dev/null +++ b/full_models/krl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003f2052e58a6826d20dd953ce7dcde08e247cac861cfa14eba59845224ad0af +size 561078838 diff --git a/full_models/krl/G_100000.pth b/full_models/krl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..231c43f37bcbda09b5c61813edf5f0486e930516 --- /dev/null +++ b/full_models/krl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31618ccb64d10d8847d6cbefe98bf7d1f39ce14fb962479eade74512aa5cc9b +size 436364598 diff --git a/full_models/krl/config.json b/full_models/krl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/krl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/krl/vocab.txt b/full_models/krl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..690407f01b502c0923c0b0831db40ed741f51fe3 --- /dev/null +++ b/full_models/krl/vocab.txt @@ -0,0 +1,31 @@ +j +l +f +č +- +i +o +a +u +m +e +_ + +b +p +' +y +h +g +ö +n +v +k +– +d +z +r +š +t +ä +s diff --git a/full_models/krr/D_100000.pth b/full_models/krr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8472608793aa87597953f0ff49451795df0f915f --- /dev/null +++ b/full_models/krr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add751b9db7a84d60ef891920567c8836692c35bf64f6e8f28d7887492b37be1 +size 561076188 diff --git a/full_models/krr/G_100000.pth b/full_models/krr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f966407c5085567f22d5cab3a4d2819a9c191106 --- /dev/null +++ b/full_models/krr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e76e89beb00538f9c220143b637db7162e8e9c8ebec7910f579e849ca829ff +size 436406588 diff --git a/full_models/krr/config.json b/full_models/krr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/krr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/krr/vocab.txt b/full_models/krr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2873f65e7534bd978db9ceb189d5d26539d7a663 --- /dev/null +++ b/full_models/krr/vocab.txt @@ -0,0 +1,58 @@ +| +ា +ែ +ម +រ +៉ +អ +្ +៊ +ត +ប +ន +ង +ក +ហ +់ +យ +គ +ស +ូ +ៃ +ឡ +វ +ិ +ី +ដ +ឹ +ើ +ះ +ព +ច +ឌ +ុ +ំ +ឺ +ល +ទ +ៀ +ណ +ឝ +ញ +ឆ +ឿ +ឞ +ខ +ឋ +ោ +ួ +ជ +ផ +ឃ +ឈ +ឍ +ថ +ភ +ធ +៝ + diff --git a/full_models/krs/D_100000.pth b/full_models/krs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1b8d9aa1c1ea4697b5ad6a7ec27cfba7d20871c9 --- /dev/null +++ b/full_models/krs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e125dbe863c9b8cae2a49421cdd3c20a19a6fc7a2ccca3de10086446aed2bdbb +size 561079226 diff --git a/full_models/krs/G_100000.pth b/full_models/krs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5632dfa933abb47a7839e090dc9d3bf947dbff18 --- /dev/null +++ b/full_models/krs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff40033b37324449c760dff10800136bf1c3e5efd174bc656921e80a3aafa955 +size 436409484 diff --git a/full_models/krs/config.json b/full_models/krs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/krs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/krs/vocab.txt b/full_models/krs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b216fcf6909a37fe7d01097d34f4055748caced7 --- /dev/null +++ b/full_models/krs/vocab.txt @@ -0,0 +1,51 @@ +ꞌ +ö +ï +s +ü +z +ã +é +l +- +ĕ +ó +â +w +_ +ẽ +ĩ +' +j +ũ +p +r +ä +û +ŋ +h +ŭ +ë +t +b +õ +n +ă +ĭ +ô +ê +á +m +ḷ +ŏ +c +f +d +k +v +î +í +y +g + +ú diff --git a/full_models/kru/D_100000.pth b/full_models/kru/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9abf9e64c04489200084d1087d9522823651c5b --- /dev/null +++ b/full_models/kru/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3e0b138c8154ea9001835b60aaffc3ff01dea06ae1f420e6c5492621d3a343 +size 561078877 diff --git a/full_models/kru/G_100000.pth b/full_models/kru/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd3dec6d6375c1164b68a303dd96c6e544f422f2 --- /dev/null +++ b/full_models/kru/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c112dfac99f99d8f301d7816335df7e9fcc023e18b2194ce3479684f72c4469 +size 436434611 diff --git a/full_models/kru/config.json b/full_models/kru/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kru/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kru/vocab.txt b/full_models/kru/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b6bfb401bd41facfdcc00bc0d9d9b9917474cb9 --- /dev/null +++ b/full_models/kru/vocab.txt @@ -0,0 +1,61 @@ +य +ॆ +े +प +' +च +ध +ै +ई +ृ +घ +़ +् +ऒ +ॊ +व +भ +झ +ओ +त +ं + +औ +ज +अ +ु +ख +ल +_ +‍ +इ +ठ +ग +- +ि +छ +ब +स +न +ू +द +म +ढ +र +थ +फ +ो +आ +ौ +ह +ड +ऎ +ी +ए +ट +ऐ +क +ा +ँ +ऊ +उ diff --git a/full_models/ksb/D_100000.pth b/full_models/ksb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..beffa678ee16f7dd0df32a99c303082881c47176 --- /dev/null +++ b/full_models/ksb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bece9cbab52a4ca6eb01d914d9c7d9fe425aca1203cce5497f0002f37c7aeb11 +size 561079121 diff --git a/full_models/ksb/G_100000.pth b/full_models/ksb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f74f084f7b627d8ec031b05f6560ea0101084a31 --- /dev/null +++ b/full_models/ksb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f74a1ef00f55d3cdbe8ca8382395f36984919b458ae4dd474140e04860adbb4 +size 436366861 diff --git a/full_models/ksb/config.json b/full_models/ksb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ksb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ksb/vocab.txt b/full_models/ksb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b6fcc3e7ca96cc7a694c3d42aa9764d15f92039 --- /dev/null +++ b/full_models/ksb/vocab.txt @@ -0,0 +1,31 @@ +g +t +ṃ +i +y +k +l + +' +e +r +m +w +ṅ +c +o +j +— +d +a +_ +z +h +v +p +n +f +b +ú +s +u diff --git a/full_models/ksr/D_100000.pth b/full_models/ksr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a7cf886d9f837f1b7e70c30b821ba831b4368c2 --- /dev/null +++ b/full_models/ksr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5ed7e42f7df2d5e594e571dd3996859bd7cbf82bf88bff4670d36a9e35f8832 +size 561077818 diff --git a/full_models/ksr/G_100000.pth b/full_models/ksr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d7a67ae98f54b8384be7134c5a74e986d9d332f6 --- /dev/null +++ b/full_models/ksr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a278c4446882e3c0eaaf8b280ad1416bb3f9a77d74a061b1aa8d135f7e17a0f1 +size 436374118 diff --git a/full_models/ksr/config.json b/full_models/ksr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ksr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ksr/vocab.txt b/full_models/ksr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d3cdbc507409b68735a156ec430ef03ca7aaaa76 --- /dev/null +++ b/full_models/ksr/vocab.txt @@ -0,0 +1,40 @@ +a +| +o +ŋ +i +e +m +n +k +u +g +j +l +t +w +r +s +b +q +y +d +p +h +z +- +f +0 +1 +7 +4 +2 +5 +' +6 +3 +9 +8 +c +v + diff --git a/full_models/kss/D_100000.pth b/full_models/kss/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..55f68aef655d5e677e59997d2102e33b824ebba2 --- /dev/null +++ b/full_models/kss/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8809e922759cc13ee30ca7dd50f4677ca3bcea1e1d5d3753ae51616786c58b94 +size 561106313 diff --git a/full_models/kss/G_100000.pth b/full_models/kss/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..960379ff919f4f83e478f6ba11930a6a89c884a8 --- /dev/null +++ b/full_models/kss/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00753cc3d3a36b5d033a61be96a72c2f5be4f38d62d6b3281b5cd4fb6f3623a0 +size 436587553 diff --git a/full_models/kss/config.json b/full_models/kss/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kss/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kss/vocab.txt b/full_models/kss/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bfc576e2e30d011c954bc7def2801665cb1fcbb0 --- /dev/null +++ b/full_models/kss/vocab.txt @@ -0,0 +1,38 @@ +| +̍ +a +ā +n +l +ɛ +̄ +o +ŋ +m +i +d +ɔ +ī +k +h +y +e +u +ō +w +ū +c +s +p +t +b +᷄ +ē +᷅ +f +g +v +- +j +' + diff --git a/full_models/ktb/D_100000.pth b/full_models/ktb/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..19f07e5cea99c318e8af00281b89d1d27aac56ef --- /dev/null +++ b/full_models/ktb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ef92d817221bf3917ae9380ff8608ac385f25d98422f64eadf13cf1f20c34f +size 561079105 diff --git a/full_models/ktb/G_100000.pth b/full_models/ktb/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..0d150e2fe744b7edacbe74f9791bf0151337fe21 --- /dev/null +++ b/full_models/ktb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771607e06782e4495c6d4d8691a637be50be7eee49898992a418fdc26ab1c08e +size 436721385 diff --git a/full_models/ktb/config.json b/full_models/ktb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ktb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ktb/vocab.txt b/full_models/ktb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4810516df8da58b41a5a493869bbe3dc54df4570 --- /dev/null +++ b/full_models/ktb/vocab.txt @@ -0,0 +1,185 @@ +| +ን +አ +እ +መ +ተ +ስ +ገ +ት +ም +ዕ +ኔ +በ +ሰ +ከ +ር +ኖ +ህ +ች +ኒ +ነ +ኑ +ደ +ኩ +ዬ +ሱ +ጠ +ረ +ለ +ክ +ሁ +ኦ +ሀ +ቀ +ቶ +ል +ሃ +ዮ +ማ +ሆ +ኬ +ኤ +ሞ +ዳ +ኮ +ቹ +ና +ኣ +ሴ +ታ +ሶ +ቴ +ዎ +ሜ +ጡ +ኡ +ሩ +ሬ +ይ +ብ +ሳ +ዘ +ኢ +ቱ +ባ +ጉ +ሌ +ሮ +ዶ +ላ +ሙ +የ +ግ +ድ +ቆ +ራ +ፈ +ፉ +ጋ +ቡ +ሄ +ሲ +ሽ +ቅ +ጃ +ቤ +ቦ +ሎ +ዋ +ሪ +ካ +ሉ +ቄ +ያ +ጎ +ቲ +ቾ +ፍ +ሚ +ቃ +ጅ +ዱ +ኪ +ጥ +ዉ +ጣ +ዲ +ሸ +ሊ +ሾ +ቢ +ወ +ው +ጀ +ጨ +ቺ +ጢ +ጦ +ጌ +ጮ +ፎ +ጩ +ጭ +ጤ +ሂ +ጊ +ዜ +ጄ +ቁ +ቼ +ጵ +- +ዊ +ሻ +ቸ +ዛ +ሼ +ጳ +ዴ +ጆ +ዝ +ፌ +ጫ +ዪ +ፋ +ጰ +ጴ +ሹ +ኗ +ጬ +ቂ +ዞ +ሺ +ዩ +ዙ +ጪ +ቿ +ቻ +ፊ +ሟ +ጁ +ቧ +ዚ +ጶ +ዌ +ጂ +ቷ +ጲ +ሏ +ጧ +ሯ +ጱ +ሷ +ኘ +ሿ +ዷ +ዟ +ዦ +ኙ +ጷ +ቋ +ኳ +ጯ +ፏ + diff --git a/full_models/ktj/D_100000.pth b/full_models/ktj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8440d979ed69496758a4a80002b32e5b6c62797f --- /dev/null +++ b/full_models/ktj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5811ae926dcbdd8d28bbf6555f53a3d1843b328c9a885567e97b0758956c567e +size 561078457 diff --git a/full_models/ktj/G_100000.pth b/full_models/ktj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91ae198d084276de93d2917eef22ff432f91c1ef --- /dev/null +++ b/full_models/ktj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae09fa67fc4607c26ab4d422c150df6a761689dddbbf5494e4aa652dc5074c9 +size 436371255 diff --git a/full_models/ktj/config.json b/full_models/ktj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ktj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ktj/vocab.txt b/full_models/ktj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..319093e59f0e13ab6842a3f3cab9cfc388b5ff59 --- /dev/null +++ b/full_models/ktj/vocab.txt @@ -0,0 +1,35 @@ +k +ɛ +p +a +i +꞊ +2 +ɩ +w +h +_ +j +b +y +l +ʋ +r +o +ɔ +s +c +ŋ +' +‐ +g + +d +ԑ +f +n +0 +m +e +u +t diff --git a/full_models/kub/D_100000.pth b/full_models/kub/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e8fa68e0dec367174ab4db8b1bece6876b3c2349 --- /dev/null +++ b/full_models/kub/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23bac86e2cb5cda9f524ce96bf635d2cfb271eaa34ee19dea1142fd95e37368b +size 561078864 diff --git a/full_models/kub/G_100000.pth b/full_models/kub/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cdbf2e2a0e8bca34b4b4daa33ff1b4421aae905e --- /dev/null +++ b/full_models/kub/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3cea48143b9dbcc83d552c22afc5983f2aff7197b19d5b08ec82eec90958816 +size 436633637 diff --git a/full_models/kub/config.json b/full_models/kub/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kub/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kub/vocab.txt b/full_models/kub/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6f73db8a3f7c767bc3c8544a450dc241d9c06b15 --- /dev/null +++ b/full_models/kub/vocab.txt @@ -0,0 +1,45 @@ +| +n +a +t +ī +i +e +k +u +w +m +s +b +ā +r +á +y +ū +ú +g +í +é +ē +d +- +f +p +ō +j +c +ó +o +h +x +l +' +z +ù +à +v +ḿ +ì +è +– + diff --git a/full_models/kue/D_100000.pth b/full_models/kue/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d64c1f8ad43aa8a4d7cbd14d87499da014a76d99 --- /dev/null +++ b/full_models/kue/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1cbf3d5b007e0aa5d5d94b034351e79423c3ce592dcd8c66fae9ba1b4e79e67 +size 561109893 diff --git a/full_models/kue/G_100000.pth b/full_models/kue/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..795843982501c97be685dfceef27d42e1bbc7975 --- /dev/null +++ b/full_models/kue/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdd75c228fcdccd3bce3ab8a0d7323af505fc29b57fbdbf2ac3b45de50ccfae5 +size 436609575 diff --git a/full_models/kue/config.json b/full_models/kue/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kue/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kue/vocab.txt b/full_models/kue/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3f0d37c9f018defd4f5a5c7f44f1e1882a730eb6 --- /dev/null +++ b/full_models/kue/vocab.txt @@ -0,0 +1,36 @@ +| +a +e +n +i +g +o +m +k +r +l +u +d +y +w +b +p +t +s +- +h +j +v +0 +f +1 +2 +7 +' +4 +5 +3 +6 +8 +9 + diff --git a/full_models/kum/D_100000.pth b/full_models/kum/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..009cc378442216471abd10531c8dec6ae6c0c808 --- /dev/null +++ b/full_models/kum/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e1ea64a894faa95c0835c22119750ed5c03ae31a45e7ef377f020ed8399e22 +size 561110094 diff --git a/full_models/kum/G_100000.pth b/full_models/kum/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..46fd9fcddffbe6975a1f6047363d9019f0fce013 --- /dev/null +++ b/full_models/kum/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c1135e5e6d49306ba773ea22ade8a00d9813f49dbe602d6255bddd6ef8da153 +size 436617123 diff --git a/full_models/kum/config.json b/full_models/kum/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kum/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kum/vocab.txt b/full_models/kum/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e1158ddb2ca6a7b25e3858045716362fe8fb6530 --- /dev/null +++ b/full_models/kum/vocab.txt @@ -0,0 +1,39 @@ +| +а +н +л +е +г +и +р +ы +ъ +д +у +б +к +т +м +с +о +з +ю +ь +й +п +ш +в +ч +я +э +ё +ж +х +– +ф +0 +1 +2 +4 +ц + diff --git a/full_models/kus/D_100000.pth b/full_models/kus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3459412a658c348ed229ecde70546a72e70fd588 --- /dev/null +++ b/full_models/kus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2314f0e90de15dcb6452e266a9587dfd62df0d5e5066b0045f3a5d970edeacfe +size 561109876 diff --git a/full_models/kus/G_100000.pth b/full_models/kus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3af512a5e23b3b6dbb6c25941d5ae1899fdd3796 --- /dev/null +++ b/full_models/kus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de2041aa63fa1c94bd8f0bab48ba955e1402b70ba04cc56770c56ac4567ad1b +size 436590655 diff --git a/full_models/kus/config.json b/full_models/kus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kus/vocab.txt b/full_models/kus/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0a9d3a94cd9d991a772d85d77975458fd7d8149d --- /dev/null +++ b/full_models/kus/vocab.txt @@ -0,0 +1,28 @@ +| +a +i +n +e +u +m +o +l +k +s +b +' +y +d +t +g +p +ŋ +r +w +z +f +j +v +h +- + diff --git a/full_models/kvn/D_100000.pth b/full_models/kvn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b700b00f65cf2b53165f573ec8a6236fd66870bc --- /dev/null +++ b/full_models/kvn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042f484c5966958b4ef47af652c11e418a38e16cc7e7b7d18dc211d61c58faf4 +size 561078720 diff --git a/full_models/kvn/G_100000.pth b/full_models/kvn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c09b02057e91eb30b1bf04f635ca4cde4256f0c0 --- /dev/null +++ b/full_models/kvn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfec857a2e9bbedb7b54683dabf62cd69c5f20d43f5a1b3373e82f611b34678 +size 436398177 diff --git a/full_models/kvn/config.json b/full_models/kvn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kvn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kvn/vocab.txt b/full_models/kvn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3175a810788c1c34cd8dfca7fd8d31e037867368 --- /dev/null +++ b/full_models/kvn/vocab.txt @@ -0,0 +1,46 @@ +m +d +f +p +h +e +k +— +8 +i +b +o +a +í +c +4 +3 +' +6 +l +g +1 +y +0 +n +9 +w +t +é +q +2 +s +_ +v +r +z +- +á +ó +5 +x +j +ú +u + +7 diff --git a/full_models/kvw/D_100000.pth b/full_models/kvw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e485ae87fd2102132398633ae20d921d3b6fa8e7 --- /dev/null +++ b/full_models/kvw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28eb7f0b46b5f99ae71b36495f7952f515ba202dc54c5bc1c0849834dfc76edc +size 561076024 diff --git a/full_models/kvw/G_100000.pth b/full_models/kvw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1f09f9b0b4082de6b06ab0a25e78b206abae2dd1 --- /dev/null +++ b/full_models/kvw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33bfde40c5430e5a277311fbbfefbcc7368d5c6a581d75a4352edb4e3c45355 +size 436331351 diff --git a/full_models/kvw/config.json b/full_models/kvw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kvw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kvw/vocab.txt b/full_models/kvw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ed32def40a29abeb6e8d4ed61a87f68ac7fac741 --- /dev/null +++ b/full_models/kvw/vocab.txt @@ -0,0 +1,26 @@ +s +' +m +t +r +l +c +w +j +e +a +- +f +_ +o +n +y +p +d + +i +g +k +h +u +b diff --git a/full_models/kwd/D_100000.pth b/full_models/kwd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9cd495261a3680d045e0469acbc180774055ba16 --- /dev/null +++ b/full_models/kwd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0516b0d050a90f732b6dd4c322d438039f3f4a921dbd245e4fe088584b1a5c6 +size 561078719 diff --git a/full_models/kwd/G_100000.pth b/full_models/kwd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49685db5eae43d966eb14b6543578a07048ab792 --- /dev/null +++ b/full_models/kwd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edb75e7846976bfa787e7fa2a24710e07bae09dff4da1e6b000d94d44885c7a5 +size 436359744 diff --git a/full_models/kwd/config.json b/full_models/kwd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kwd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kwd/vocab.txt b/full_models/kwd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..25762f5209f9bbf44852a35b0932021a4a3a6ed0 --- /dev/null +++ b/full_models/kwd/vocab.txt @@ -0,0 +1,30 @@ +h +0 +f +_ +w +k +l + +g +j +v +t +1 +4 +n +r +o +6 +2 +d +e +m +' +p +i +u +s +b +— +a diff --git a/full_models/kwf/D_100000.pth b/full_models/kwf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe398f5ee484c096d0ca7e4a3dac26f357fca01d --- /dev/null +++ b/full_models/kwf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73cddf0b824e5e7eba38c6fcbee41dea4e42f1e88fca4cbeb4dd94d5a59419ea +size 561078710 diff --git a/full_models/kwf/G_100000.pth b/full_models/kwf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..588f7ed406d84870f195f8e81a2d7506c031287b --- /dev/null +++ b/full_models/kwf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d68de801421f5ebd0a7b1bc6d8abd5ce844db5715bd447ee18dc54e84313a9cb +size 436368942 diff --git a/full_models/kwf/config.json b/full_models/kwf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kwf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kwf/vocab.txt b/full_models/kwf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ba6c567fe60abb55cd18ca6d03637db89e6cacf4 --- /dev/null +++ b/full_models/kwf/vocab.txt @@ -0,0 +1,34 @@ +n +s +3 + +0 +1 +2 +l +4 +r +k +w +g +9 +c +h +i +b +f +a +6 +d +j +u +5 +p +t +_ +o +e +' +y +m +v diff --git a/full_models/kwi/D_100000.pth b/full_models/kwi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..54628754bfa3b2b09881f48973147f6f4a488d87 --- /dev/null +++ b/full_models/kwi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9004918ca5fa2c19e4f60eebef6eddcdf3ba3110c53af68de9010605a7e9dbf2 +size 561110238 diff --git a/full_models/kwi/G_100000.pth b/full_models/kwi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e0dace4820f067b080b90c9a0332575490e17158 --- /dev/null +++ b/full_models/kwi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5dc0fd026ccc523bee028c4a1e6450c2678a566145940be14e3144705901edc +size 436629952 diff --git a/full_models/kwi/config.json b/full_models/kwi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kwi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kwi/vocab.txt b/full_models/kwi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..66bd2832414dc1d5a115a1c2a38dbed4f25b2c7b --- /dev/null +++ b/full_models/kwi/vocab.txt @@ -0,0 +1,43 @@ +a +| +n +i +u +k +s +t +p +m +z +r +w +e +ɨ +h +l +o +c +d +j +ñ +y +ú +b +í +— +é +' +g +á +ĩ +f +ó +v +ã +q +0 +x +1 +2 +4 + diff --git a/full_models/kxc/D_100000.pth b/full_models/kxc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..072d41de981e070ce560b6dcb88cfda2674fc383 --- /dev/null +++ b/full_models/kxc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7493461b427857b55979789e031cc83bced96573550a7d05e397d986e551ca7e +size 561110140 diff --git a/full_models/kxc/G_100000.pth b/full_models/kxc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fee5af32f2d951af847f1398070c626c46586e0b --- /dev/null +++ b/full_models/kxc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49812d44369fd01f2f84539b2457b7ea16b2c20b5338c2e29c3475f0e65ce07 +size 436862528 diff --git a/full_models/kxc/config.json b/full_models/kxc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kxc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kxc/vocab.txt b/full_models/kxc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2366a9107dc89aa7a59119a9d1cf73c187f837a4 --- /dev/null +++ b/full_models/kxc/vocab.txt @@ -0,0 +1,144 @@ +| +ን +ከ +ተ +አ +እ +መ +ፐ +ረ +ነ +ሴ +ኦ +ሰ +ይ +ቀ +ዴ +ለ +ክ +ኔ +ስ +ር +ደ +ኤ +ዬ +ቶ +ፕ +ት +ቴ +ኮ +ል +ኖ +ም +ድ +ሾ +ሀ +ሽ +ሸ +ፖ +የ +ው +ዋ +ሌ +ወ +ኬ +ኩ +ኸ +ኡ +ቁ +ሱ +ሼ +ፎ +ታ +ሎ +ሞ +ሬ +ሜ +ቆ +ሶ +ሮ +ፈ +ማ +ካ +ዳ +ና +ፒ +ዮ +ቱ +ኪ +ሄ +ኣ +ጨ +ሃ +ቄ +ላ +ኾ +ኻ +ቅ +ፔ +ዌ +ፑ +ዶ +ያ +ዲ +ሙ +ሁ +ፓ +ቃ +ዱ +ፌ +ፉ +ቻ +ቾ +ጫ +ኑ +ፋ +ጩ +ሳ +ፍ +ቸ +ኼ +ህ +ሉ +ጬ +ቲ +ኹ +ሩ +ሆ +ራ +ሚ +ች +ኜ +ኘ +ጭ +ቺ +ዎ +ኒ +ሹ +ሲ +ኝ +ኽ +ሺ +ጵ +ጰ +ሻ +ቹ +ጪ +ዩ +ሪ +ጮ +ሂ +ሊ +ኙ +ኢ +ቂ +ኛ +- +ጴ +ጳ +ኞ +ጶ +ፊ +ኺ +ዊ + diff --git a/full_models/kxf/D_100000.pth b/full_models/kxf/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..04f3e30083c9e78b52d942d30febda39a56ae074 --- /dev/null +++ b/full_models/kxf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f38b0f3e8ed65feae0d029f711fa04e65b0f0c8f611e12c5a73c04d1a212e8f +size 561076164 diff --git a/full_models/kxf/G_100000.pth b/full_models/kxf/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9606e107ca9b326c06f5f9b95314d7426b667133 --- /dev/null +++ b/full_models/kxf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b5f1f4ce91e2bcfceb7e97785efa28b397809ff9843dbbe96b760e981e4f92 +size 436360151 diff --git a/full_models/kxf/config.json b/full_models/kxf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kxf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kxf/vocab.txt b/full_models/kxf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8ffcbdf0574b43d9d67c8b3dc90fc27e775168e9 --- /dev/null +++ b/full_models/kxf/vocab.txt @@ -0,0 +1,38 @@ +| +̌ +h +a +k +̤ +t +û +ô +s +ǎ +p +î +l +ò +n +ǒ +d +è +ě +m +b +e +y +u +w +o +ǐ +ǔ +g +c +i +ṳ +r +j +̂ +' + diff --git a/full_models/kxm/D_100000.pth b/full_models/kxm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a7df0c380b67c0af337379d841a181245af4b40 --- /dev/null +++ b/full_models/kxm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b200c243eaf89895e2a26527c238c2c80552f0257bb3a2af0b8746303d098b6a +size 561109362 diff --git a/full_models/kxm/G_100000.pth b/full_models/kxm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf03330313c8302dfa1c79d58d3757542c00264e --- /dev/null +++ b/full_models/kxm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c09f583783d151e72a208e2b7faea519523848285b20c79a4d5256a0b40276b +size 436634510 diff --git a/full_models/kxm/config.json b/full_models/kxm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kxm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kxm/vocab.txt b/full_models/kxm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a96f6db397173c1d1821b819e8aa0facb4d4a849 --- /dev/null +++ b/full_models/kxm/vocab.txt @@ -0,0 +1,47 @@ +| +อ +เ +น +ฺ +ย +็ +ี +ร +ง +า +ฮ +ด +ม +ก +ิ +ป +บ +ั +ล +แ +จ +ต +ว +ซ +ค +ื +โ +ท +พ +ะ +ํ +ู +ญ +ุ +ึ +ช +ไ +ฟ +0 +1 +2 +' +` +๋ +- + diff --git a/full_models/kxv/D_100000.pth b/full_models/kxv/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f5b04713c4feca7ff7d933b795d6b61b9237536e --- /dev/null +++ b/full_models/kxv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233d2ba17df7e54846b4b519f8eb75f8d7fa8896c8ae00454c428272c854dab1 +size 561076027 diff --git a/full_models/kxv/G_100000.pth b/full_models/kxv/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f03235d2761117603c366007ce56a0b0d7dc71d7 --- /dev/null +++ b/full_models/kxv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3b55d3bf98ea34014ba0553a8f5818e2d14f73098e66808b3c19acd6b08c3ce +size 436368292 diff --git a/full_models/kxv/config.json b/full_models/kxv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kxv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kxv/vocab.txt b/full_models/kxv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4dffbf98fa8df55ca78f34ff22d0606e1bd3043 --- /dev/null +++ b/full_models/kxv/vocab.txt @@ -0,0 +1,42 @@ +| +ା +ି +଼ +େ +ର +୍ +ତ +ନ +ଏ +ସ +ମ +ୁ +କ +ହ +ଁ +ଜ +ୱ +ଲ +ଇ +ଆ +ପ +ବ +ଣ +ଚ +ୀ +ଦ +ଗ +ଡ +ଟ +ୟ +ଞ +ଅ +ଙ +ୂ +ଈ +ଃ +ଂ +ଊ +ଉ +' + diff --git a/full_models/kyb/D_100000.pth b/full_models/kyb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d12b1287b1fe50ec8e22b144c1eaaeeda149a12 --- /dev/null +++ b/full_models/kyb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc5ba662f20733342dafe64f22d902c45824db3bbdb3857ade7bfb0c39a8de6 +size 561079257 diff --git a/full_models/kyb/G_100000.pth b/full_models/kyb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eaa5449e926d72b8e3f57490b4e2561f36393199 --- /dev/null +++ b/full_models/kyb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9641832a1fe5990f43c526bbaff5de0f544ab97071a484ddc706ab20dcc2c3 +size 436380755 diff --git a/full_models/kyb/config.json b/full_models/kyb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyb/vocab.txt b/full_models/kyb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e8d4ef95b1cddda0d1b1dbfbc3d5a4865dc82f94 --- /dev/null +++ b/full_models/kyb/vocab.txt @@ -0,0 +1,37 @@ +v +q +' +l +o +w +s +p +g +i +0 +1 +6 +d +– +j +3 +b +n +4 + +h +a +r +f +_ +x +m +z +u +t +- +— +c +k +e +y diff --git a/full_models/kyc/D_100000.pth b/full_models/kyc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d57a5accdc530e7008ee22fe290406ace8fb7a26 --- /dev/null +++ b/full_models/kyc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e701bfe1bdd54b8b032fd26c310ff01c4475758f81bccf71142b41e47919583 +size 561109612 diff --git a/full_models/kyc/G_100000.pth b/full_models/kyc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ac491cbf6b1ed00764518454226b4263d11557c --- /dev/null +++ b/full_models/kyc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ed0ab4dadf7aad6bbfcae6ede2e22ba8bd77a692b3f815edf84c99b8c3f7b8 +size 436611725 diff --git a/full_models/kyc/config.json b/full_models/kyc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyc/vocab.txt b/full_models/kyc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..38d0d1fb4700720e650717514c40ddaf1b90f7c0 --- /dev/null +++ b/full_models/kyc/vocab.txt @@ -0,0 +1,37 @@ +a +| +o +n +e +i +p +k +m +y +u +l +d +r +g +s +b +w +t +j +ŋ +- +0 +' +h +4 +1 +c +2 +6 +7 +3 +v +9 +f +` + diff --git a/full_models/kyf/D_100000.pth b/full_models/kyf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdb62b89691cc9eb2dc770e30a9789ad23883544 --- /dev/null +++ b/full_models/kyf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2687a6862f023d08006b3e00efdd3df272ef417da6a7f39bb26a05c9db9b972e +size 561079472 diff --git a/full_models/kyf/G_100000.pth b/full_models/kyf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c0ea70f46a0ec66126ed053f2df9953f0f72302 --- /dev/null +++ b/full_models/kyf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc6b223f8f55729951d183747a4f41a5394c36fe4c14fbe080e3d601eb059494 +size 436369955 diff --git a/full_models/kyf/config.json b/full_models/kyf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyf/vocab.txt b/full_models/kyf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71abe31d5c43a8f97aa8546a2f920865a2238aa5 --- /dev/null +++ b/full_models/kyf/vocab.txt @@ -0,0 +1,32 @@ +s +ŋ +m +_ +j +g +h +w +e +ɔ +z +b +c +u +ʋ +ɩ +- +l +' +k +o +d +a +t +p +y +n +ɛ +f + +v +i diff --git a/full_models/kyg/D_100000.pth b/full_models/kyg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..715579b87c6fba0ec2bca61035874621a2a527b2 --- /dev/null +++ b/full_models/kyg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47021b1e4a75dbb0c7818975e707e7ec53baf4fdfd50e54a99812ce070f4f96 +size 561076027 diff --git a/full_models/kyg/G_100000.pth b/full_models/kyg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d43e7b4bd0e288e17974dd95f39708d4a1b5d7de --- /dev/null +++ b/full_models/kyg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbea5a6fac6d473f699e03507b4cbde22816d58d2f41888dbdfdaa3d7dd7192a +size 436317603 diff --git a/full_models/kyg/config.json b/full_models/kyg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyg/vocab.txt b/full_models/kyg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..974557c8d6e19b425a4be03643311fa245259d55 --- /dev/null +++ b/full_models/kyg/vocab.txt @@ -0,0 +1,20 @@ +a +| +e +o +' +i +n +m +g +u +y +h +l +t +p +k +f +v +s + diff --git a/full_models/kyo/D_100000.pth b/full_models/kyo/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ca1141efabccee8268236e1bc8d87327da83b37 --- /dev/null +++ b/full_models/kyo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6032178c404132668b6c44a0fcdd916c52cb1ffd06eb010d7d56718b9b840bfc +size 561075941 diff --git a/full_models/kyo/G_100000.pth b/full_models/kyo/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..973b63a95b9457efeb31681cdc6d4cf6d7431efa --- /dev/null +++ b/full_models/kyo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2bc8988120627aa89b39e8224aadd79b6e0d1a60f28dd1020dc17080f556f3 +size 436338342 diff --git a/full_models/kyo/config.json b/full_models/kyo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyo/vocab.txt b/full_models/kyo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8f2aa1f41fb310af1250a70c414cfe92afcd7ec2 --- /dev/null +++ b/full_models/kyo/vocab.txt @@ -0,0 +1,29 @@ +| +a +n +g +i +o +e +é +h +u +l +k +m +y +d +b +t +r +s +ó +w +p +' +- +j +3 +7 +c + diff --git a/full_models/kyq/D_100000.pth b/full_models/kyq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a329579b81feb297e84ad5482bf5aa3fcd7c4e59 --- /dev/null +++ b/full_models/kyq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d9fd86d62841c7f867043888c6df9096e68ddb2f39468fcdf208c454af1d8f0 +size 561078341 diff --git a/full_models/kyq/G_100000.pth b/full_models/kyq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8ec941aee4bfc5e24432ca962dc5ee50bc7bc2f0 --- /dev/null +++ b/full_models/kyq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489998c2d67d04a6df2941ea339ef6269fb45878535467393ea892e42b2ca222 +size 436364493 diff --git a/full_models/kyq/config.json b/full_models/kyq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyq/vocab.txt b/full_models/kyq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4061bf0eb72bfa4e190d6dc3b9816fd0ec6d47c --- /dev/null +++ b/full_models/kyq/vocab.txt @@ -0,0 +1,32 @@ +| +a +e +n +k +ɔ +i +t +s +m +ɛ +g +o +u +ɗ +r +j +̰ +l +d +b +' +ŋ +y +ɓ +p +c +‐ +z +w +ƴ + diff --git a/full_models/kyu/D_100000.pth b/full_models/kyu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e64f5beb3bcbfbd6e1dc67c2523ff46ee890f51d --- /dev/null +++ b/full_models/kyu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c17d3a8847c2ff6b27935375ad96c4b5b00d3cfdf530d9efea77eeb62dc5b7 +size 561076168 diff --git a/full_models/kyu/G_100000.pth b/full_models/kyu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c2f5fb407358798d1e8e8f6408e9978deddf9f43 --- /dev/null +++ b/full_models/kyu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df140fc2cb41b8a85e093b9abc0b6e85389f35cdad471a35c699abe58fe023a +size 436362535 diff --git a/full_models/kyu/config.json b/full_models/kyu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyu/vocab.txt b/full_models/kyu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cbffec343a3c5ab19a63c66c7426ce14ec7dbb7f --- /dev/null +++ b/full_models/kyu/vocab.txt @@ -0,0 +1,39 @@ +ꤢ +| +꤬ +ꤟ +꤭ +ꤩ +ꤛ +ꤧ +ꤣ +ꤒ +ꤔ +ꤪ +ꤚ +ꤤ +ꤨ +ꤕ +ꤊ +ꤥ +ꤜ +ꤗ +ꤌ +ꤞ +ꤘ +ꤡ +ꤋ +ꤦ +ꤙ +ꤓ +ꤖ +ꤏ +ꤝ +ꤠ +ꤑ +ꤐ +ꤍ +ꤎ +m +' + diff --git a/full_models/kyz/D_100000.pth b/full_models/kyz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a67a2e8d0abe1d35921b3ebead6ce6fcc970adaa --- /dev/null +++ b/full_models/kyz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee96e488c1e64367c5661756ea894385ff7d86d5662164e8ef851ecb2e265ef8 +size 561076188 diff --git a/full_models/kyz/G_100000.pth b/full_models/kyz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6110e0cc48ef73e99a6439d615d37ee989a6c1f4 --- /dev/null +++ b/full_models/kyz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9918f565b3dbd6472e3601f61c7960f7b14576951200014f1269599449dea67 +size 436360411 diff --git a/full_models/kyz/config.json b/full_models/kyz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kyz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kyz/vocab.txt b/full_models/kyz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7fa094fece1d390533b3a5e194b9e167fb0e903d --- /dev/null +++ b/full_models/kyz/vocab.txt @@ -0,0 +1,38 @@ +g +ẽ +e +4 +o +z +_ +v +ã +6 +a +r +k +— +m +c +ĩ +ũ +õ +w +s +l + +u +b +t +h +n +x +i +f +ỹ +0 +d +' +y +j +p diff --git a/full_models/kzf/D_100000.pth b/full_models/kzf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..449ba15330ff92dddf571fdc2b4eec4efbe7788f --- /dev/null +++ b/full_models/kzf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d5fb5f6f331e7d67da3daa6d83512210f76cd2285674a8798ef7a165b6f590 +size 561079016 diff --git a/full_models/kzf/G_100000.pth b/full_models/kzf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d1eecfafd52eb8ae663b1f82165c7c652a26dd9 --- /dev/null +++ b/full_models/kzf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade2d287372ee59eeeb949c38f45854f03c80afee1f7d7a939db7c5c0dcce597 +size 436355292 diff --git a/full_models/kzf/config.json b/full_models/kzf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/kzf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/kzf/vocab.txt b/full_models/kzf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2e8dac141eea50f7a0099152878117fd3ac0924c --- /dev/null +++ b/full_models/kzf/vocab.txt @@ -0,0 +1,27 @@ +l +t +j +e +d +z +c +k +m +a +i +s +h +g +o +' +n +- +b +u +p +r +_ +y +f + +w diff --git a/full_models/lac/D_100000.pth b/full_models/lac/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..106cfee5d350fd276c45f7bdcada0078a41bcec6 --- /dev/null +++ b/full_models/lac/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36b26c328e2e896a2700ec67dc00e4ecf5f975b284c0c514ddf6f4c19c27cc7 +size 561078126 diff --git a/full_models/lac/G_100000.pth b/full_models/lac/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0ff0aa31971a314fe797e66fdf76e866257cec3c --- /dev/null +++ b/full_models/lac/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f1cac36ea2db23e0df4a0d6cbfd4324a9541eb0a20c51cc6d65b3a19a26ae76 +size 436375725 diff --git a/full_models/lac/config.json b/full_models/lac/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lac/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lac/vocab.txt b/full_models/lac/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..651242559e27b0d39dfaed0737f09505477a443f --- /dev/null +++ b/full_models/lac/vocab.txt @@ -0,0 +1,37 @@ +- +a +ó +r +ú +x +l +c +o +s +n +j +e +m +p +u +k + +í +g +_ +d +t +f +ñ +i +b +w +q +h +' +ʌ +é +z +y +á +v diff --git a/full_models/laj/D_100000.pth b/full_models/laj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..31487e95299f4540e112f5e526c61952e26e5b34 --- /dev/null +++ b/full_models/laj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e25dda044b900a27dbffd89f5f288ff9b2fcde96ce65101ee4601dda2667eb +size 561078851 diff --git a/full_models/laj/G_100000.pth b/full_models/laj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5ca5cc6f3d9c9c501cffae260cd0e7478692cb49 --- /dev/null +++ b/full_models/laj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1968571ed2c7475837a6e6fc82cbf7c9cf848fde5106c0fbab70b6444796ffe +size 436355748 diff --git a/full_models/laj/config.json b/full_models/laj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/laj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/laj/vocab.txt b/full_models/laj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..96df84e3ec0d84dc9d931c148b317e3d5b830fcc --- /dev/null +++ b/full_models/laj/vocab.txt @@ -0,0 +1,28 @@ +| +o +a +e +i +n +k +m +t +r +w +u +y +d +c +b +ŋ +l +p +g +j +- +' +f +v +s +h + diff --git a/full_models/lam/D_100000.pth b/full_models/lam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..927ce784bfdbc04a001de0522360fd93d8f6a548 --- /dev/null +++ b/full_models/lam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6582200159f0dc967d6d9f70796a52e355618e44618aa7aa7811625e153b6420 +size 561078989 diff --git a/full_models/lam/G_100000.pth b/full_models/lam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97e39b673b8dbd4613a5cc31b7d873ddda31f6b5 --- /dev/null +++ b/full_models/lam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254b0d3ca0a0a6bf0794e581fdb83fe57ee71fbfbb4992ce7ca32d729886da15 +size 436360587 diff --git a/full_models/lam/config.json b/full_models/lam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lam/vocab.txt b/full_models/lam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d372d74402eafbf649c65f48a672d9a3cc4e7767 --- /dev/null +++ b/full_models/lam/vocab.txt @@ -0,0 +1,29 @@ +a +| +i +u +e +l +k +n +m +ŵ +o +s +w +t +y +p +f +b +c +ŋ +d +g +' +j +- +— +v +ʼ + diff --git a/full_models/lao/D_100000.pth b/full_models/lao/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..eaa91fb0ce952a6b6a52b62fc09705be2cccdd89 --- /dev/null +++ b/full_models/lao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac4b954e32f36d0c1c61b7eedee668417d13e4f3e6b6c08b9651b0e659e5035 +size 561078765 diff --git a/full_models/lao/G_100000.pth b/full_models/lao/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..b56aea075d29649c775c3d6defec1c987364be86 --- /dev/null +++ b/full_models/lao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b212a2c67d73e9299067a528582206402d70de1da5e61166db5b8eb8990338d +size 436411894 diff --git a/full_models/lao/config.json b/full_models/lao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lao/vocab.txt b/full_models/lao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9057504f0832f120873142888cd473bbc46cbcdd --- /dev/null +++ b/full_models/lao/vocab.txt @@ -0,0 +1,51 @@ +ດ +ແ +ຝ +ໃ +ຍ +ຈ +- +ູ +ສ +ະ +ຣ +ບ +ຄ +ນ +ປ +ຜ +ຸ +' +້ +ົ +ິ +ຼ +ງ +ຂ +ີ + +_ +ຖ +າ +ັ +ທ +ໂ +ພ +ຫ +່ +ຟ +ື +ໍ +ວ +ຽ +ຶ +ຮ +ຢ +ເ +ລ +ຕ +ກ +ອ +ມ +ໄ +ຊ diff --git a/full_models/las/D_100000.pth b/full_models/las/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a4e83d419f32933ff900e5367ab17808e506e84 --- /dev/null +++ b/full_models/las/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:016ff0d61b28814104071dae0816f173c2276fdb0f779a768f05cd36866b14c7 +size 561078984 diff --git a/full_models/las/G_100000.pth b/full_models/las/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5686102034f8a71f6601b0a5187f1e3157b2f01e --- /dev/null +++ b/full_models/las/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f05f93115577cfade3d2224b713418c5b53b673693469df3d3dd798f4a1e0b +size 436366234 diff --git a/full_models/las/config.json b/full_models/las/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/las/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/las/vocab.txt b/full_models/las/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8246912760de17cf0118186bc9468ab23f725506 --- /dev/null +++ b/full_models/las/vocab.txt @@ -0,0 +1,32 @@ +| +a +e +n +t +s +ɛ +r +ɩ +i +k +ʋ +w +m +l +ɔ +ꞌ +- +p +y +o +u +ñ +c +ɖ +h +f +ŋ +' +đ +d + diff --git a/full_models/lat/D_100000.pth b/full_models/lat/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ef4aa11f89c070478f4b05f5f53121781e3f77f0 --- /dev/null +++ b/full_models/lat/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151e5d05c06ced008cf5366a0d0085be2629f741b619a791e3272ef75764a757 +size 561079259 diff --git a/full_models/lat/G_100000.pth b/full_models/lat/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..48d05b26b4fecc14b4695e2b9443513747e6ab01 --- /dev/null +++ b/full_models/lat/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b142a51368521e63236b2489256e76d85fabd5904d42e4b67b8ee25310e0cb18 +size 436363168 diff --git a/full_models/lat/config.json b/full_models/lat/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lat/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lat/vocab.txt b/full_models/lat/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2bb75a90b81ef8eedfccc63c8badc40fd5773955 --- /dev/null +++ b/full_models/lat/vocab.txt @@ -0,0 +1,29 @@ +l +p +b +t +f +z +r +s +í + +_ +— +v +- +ì +c +d +h +i +g +x +n +q +a +m +o +y +u +e diff --git a/full_models/lav/D_100000.pth b/full_models/lav/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa82f35355564501f8e80a4586a555682cd0f982 --- /dev/null +++ b/full_models/lav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71825cc30ee6181500ffeb47b4b5185e0fcda4fca18216aeab676be25b9f879 +size 561110403 diff --git a/full_models/lav/G_100000.pth b/full_models/lav/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b7d5b82df5bc1f356ab4483ed23c59db77f771ec --- /dev/null +++ b/full_models/lav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1576dd1da31aee138777e85ecc2906b4b31d204e5eed80118b2a3febc3efe89 +size 436617955 diff --git a/full_models/lav/config.json b/full_models/lav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lav/vocab.txt b/full_models/lav/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..982e3d903433313e12ff9841b223ad76dbe0f6d0 --- /dev/null +++ b/full_models/lav/vocab.txt @@ -0,0 +1,37 @@ +u +a +v +ķ +b +d +p +o +z +ģ +č +š +h +i +ā +g +e +_ +ī + +– +c +s +f +l +ē +r +n +m +t +ū +k +- +ļ +ņ +ž +j diff --git a/full_models/law/D_100000.pth b/full_models/law/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5ee24c8cc5bb34b344e412257e4b79008b4fd2bf --- /dev/null +++ b/full_models/law/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e9bc580270870511886962797f5200627467a118d59d0db2a77b858062e6bf +size 561076156 diff --git a/full_models/law/G_100000.pth b/full_models/law/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa7196ba2e4e5c1cfb2d1bc3b294788581fea195 --- /dev/null +++ b/full_models/law/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ecf7bfdb431004e811a5c5de24ae102fd32ba5ed442dc11a9bb0774a39f959 +size 436342063 diff --git a/full_models/law/config.json b/full_models/law/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/law/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/law/vocab.txt b/full_models/law/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..89498d9f4eb524f1354ac501ddcc1d9eb5e1ec2c --- /dev/null +++ b/full_models/law/vocab.txt @@ -0,0 +1,30 @@ +u +d +w +m +h +_ +l +' +b +r +s +o + +5 +e +` +j +y +k +g +t +9 +p +c +v +1 +n +a +8 +i diff --git a/full_models/lbj/D_100000.pth b/full_models/lbj/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d96ae102703edc40a73ca32b701c39f852d2f8e9 --- /dev/null +++ b/full_models/lbj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd156d93d9d3986f3930e4ec625dee47e72e0db97a7c002d97c4900b41388fda +size 561076025 diff --git a/full_models/lbj/G_100000.pth b/full_models/lbj/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0f1c4f49aa4ba37e20e27d54a5f763c4c330b03 --- /dev/null +++ b/full_models/lbj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21edd55ace6bf17c97458b97bb61f0bbc1818db1b77d35f1af1947507288d23 +size 436402852 diff --git a/full_models/lbj/config.json b/full_models/lbj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lbj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lbj/vocab.txt b/full_models/lbj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..42ab17ed3189000ceeb9ac4f60695866ff9dafac --- /dev/null +++ b/full_models/lbj/vocab.txt @@ -0,0 +1,57 @@ +་ +| +ས +ན +ི +ོ +ང +ད +ག +ེ +མ +ུ +བ +འ +ལ +ར +ཡ +ཁ +ཀ +ྱ +པ +ཏ +ཤ +ཞ +ཅ +ྲ +ཟ +ཆ +ཚ +ཕ +ླ +ྐ +ཱ +ྟ +ཉ +ཛ +ྒ +ཐ +ཧ +ཙ +ཨ +ྡ +ྔ +ཇ +ྤ +ྩ +ྙ +ྕ +ྨ +ྫ +ྣ +ྗ +ྭ +ྦ +ྷ +ཝ + diff --git a/full_models/lbw/D_100000.pth b/full_models/lbw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d7bbd92d5f86566593e4528d4ce129759660c1bf --- /dev/null +++ b/full_models/lbw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf01a9541bdeb86c9e958650ef36c5f7a16d5f529b4a42fcccd3c0b4e0039d87 +size 561078860 diff --git a/full_models/lbw/G_100000.pth b/full_models/lbw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6e300138b81b2111ddab3ecce5bd39df0784eead --- /dev/null +++ b/full_models/lbw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce36fe3f6adeb71a15debbcfd703cfd777c64baeba6f67469e0b8aa22398314 +size 436350708 diff --git a/full_models/lbw/config.json b/full_models/lbw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lbw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lbw/vocab.txt b/full_models/lbw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77d074b031eaed161319f5a295270e10768bd472 --- /dev/null +++ b/full_models/lbw/vocab.txt @@ -0,0 +1,25 @@ +s +h +' +b +m +w +a +n +- +y +i +k +d +l +e + +_ +o +r +p +g +t +j +u +c diff --git a/full_models/lcp/D_100000.pth b/full_models/lcp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c29e47bfe93cfe6b6a947a50b2f918edc30ae896 --- /dev/null +++ b/full_models/lcp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63742260c7ee65892b00063d4a1b8195ce0dca7dfa9db0f3708ff4ad92b89621 +size 561079259 diff --git a/full_models/lcp/G_100000.pth b/full_models/lcp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0bd2e3b18d4c11883f514e671df4386a78d51c41 --- /dev/null +++ b/full_models/lcp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0fd12893654cb53d874a863049d37fc712f3c48820fc92e92c76e3de2d5dba4 +size 436392387 diff --git a/full_models/lcp/config.json b/full_models/lcp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lcp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lcp/vocab.txt b/full_models/lcp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..07fce5dbb9325c629721b8e76bb60b0f17029fc2 --- /dev/null +++ b/full_models/lcp/vocab.txt @@ -0,0 +1,42 @@ +ค +ฌ +ด +ะ +_ +ซ +จ +แ +ฮ +ั +ร +k +พ +ิ +โ +ฆ +ช + +ย +า +ี +ต +ึ +ท +ว +่ +ื +ญ +ม +ป +ก +ุ +' +เ +ง +ู +น +อ +ฟ +ไ +ล +บ diff --git a/full_models/lee/D_100000.pth b/full_models/lee/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..09b960889abeefa63959f5c229a94e6d1e119d6f --- /dev/null +++ b/full_models/lee/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c747d8ad4ca75f154b72fd5adb0a5f7dfa0cb8ba3c7fd3080e9a49d1b750d10 +size 561078701 diff --git a/full_models/lee/G_100000.pth b/full_models/lee/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e487d43865a8500c9e90fc9bebb06300f2f6cb13 --- /dev/null +++ b/full_models/lee/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ca7cd0e3d346a1bd59683e561645805c5895b558903ba86e8dd9258fd5cf3d +size 436438217 diff --git a/full_models/lee/config.json b/full_models/lee/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lee/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lee/vocab.txt b/full_models/lee/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4429b34cd635330685320b946f1dab9c815ee023 --- /dev/null +++ b/full_models/lee/vocab.txt @@ -0,0 +1,64 @@ +| +ə +n +́ +̀ +y +ɛ +b +w +m +l +ɔ +r +a +d +i +á +z +à +s +h +k +c +t +' +í +ì +g +é +ń +ǹ +̃ +e +ó +ù +u +- +j +p +ò +ú +̌ +è +ẽ +ǎ +ê +ã +ǐ +v +â +ĩ +ŋ +f +o +õ +ǔ +ě +ũ +ô +ǒ +ṹ +ṍ +̂ + diff --git a/full_models/lef/D_100000.pth b/full_models/lef/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68fc4bae11c230dedca881a29fec63fed550d3cb --- /dev/null +++ b/full_models/lef/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326c47924cedbe96382ff7f82f87fe31bcb00c840f063f7522abcefbbc01ee39 +size 561078850 diff --git a/full_models/lef/G_100000.pth b/full_models/lef/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..387d63a001f71bbbf79b29346f3225167ddfc658 --- /dev/null +++ b/full_models/lef/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7fa8e637b497e98f844e5d08b7bc03109cae6af2bd3712f49cae90b28b8aef6 +size 436378222 diff --git a/full_models/lef/config.json b/full_models/lef/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lef/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lef/vocab.txt b/full_models/lef/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..353b8e233655fffedacd4952924448d4de3cb3e1 --- /dev/null +++ b/full_models/lef/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +n +ɔ +u +k +b +l +e +m +ɛ +t +d +y +s +o +w +- +ƒ +́ +p +g +á +ú +é +r +v +í +' +h +ó +ń +ḿ +6 +2 + diff --git a/full_models/lem/D_100000.pth b/full_models/lem/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1205c1359154ab72d10ed7aaf7c9ce5b6505974 --- /dev/null +++ b/full_models/lem/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1ed2b7681a4282992d06f6f012a728a7db292548041b434aeea9e794d68d64 +size 561078735 diff --git a/full_models/lem/G_100000.pth b/full_models/lem/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7237b309d88ca9510abe0fcc4c056aa27316c260 --- /dev/null +++ b/full_models/lem/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b1b34cd4d3fe6f381dcd72902df73b2a3b03cd9fdd5ffd1829307b71a4ecfbb +size 436369093 diff --git a/full_models/lem/config.json b/full_models/lem/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lem/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lem/vocab.txt b/full_models/lem/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a681822d41a18c680fbdbca69cea54c3dcf704f6 --- /dev/null +++ b/full_models/lem/vocab.txt @@ -0,0 +1,34 @@ +| +a +n +ɔ +́ +b +á +ɛ +e +m +y +i +í +k +é +t +ŋ +u +l +s +ú +c +h +o +w +ó +d +f +j +g +ʼ +- +' + diff --git a/full_models/lew/D_100000.pth b/full_models/lew/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a7ccc484aaa98ea6e0994d775d0fafb4e978e29d --- /dev/null +++ b/full_models/lew/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e09bfde4a433b320c3ccccb3ce6ee815539c2a6557c62cb76e68d31846c6829 +size 561078743 diff --git a/full_models/lew/G_100000.pth b/full_models/lew/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68473e269ff50d7c77108ad963ca4f27f36c5192 --- /dev/null +++ b/full_models/lew/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978cd36c3ce3a9cbc50d918639aa6a974cb06aff214a6796a5834e20283d3c68 +size 436371386 diff --git a/full_models/lew/config.json b/full_models/lew/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lew/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lew/vocab.txt b/full_models/lew/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9e603a83e15b5d77e4e40e695eea428ef1f8337e --- /dev/null +++ b/full_models/lew/vocab.txt @@ -0,0 +1,34 @@ +a +| +n +i +u +o +m +t +e +p +r +s +k +l +b +g +d +y +v +h +- +j +f +˻ +˼ +z +c +w +' +1 +— +9 +2 + diff --git a/full_models/lex/D_100000.pth b/full_models/lex/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5a2bc401e97bb584098bdd1f9019f5a31c97033d --- /dev/null +++ b/full_models/lex/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2d51cb3f797fa1d335ff4d8697d45a3b0b4da01392562d482fc5e7391bf1cf +size 561078612 diff --git a/full_models/lex/G_100000.pth b/full_models/lex/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9411190e277cabcbdb7239de5d69ac89336a1dba --- /dev/null +++ b/full_models/lex/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc801b9673aa99e90b9d24c1870d0da4a12005fad0b7c3f733f4f0fc9d697d7 +size 436352955 diff --git a/full_models/lex/config.json b/full_models/lex/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lex/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lex/vocab.txt b/full_models/lex/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b4377f634abc4bc1e27ed1724117cc766e13931e --- /dev/null +++ b/full_models/lex/vocab.txt @@ -0,0 +1,27 @@ +_ +l +e +i +a +o +c +t +w +b +m +k +j +p +s +n +h +u +' +z +r +f +g + +y +- +d diff --git a/full_models/lgg/D_100000.pth b/full_models/lgg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..25e73be991793c002c28157e6db8413a03e0981a --- /dev/null +++ b/full_models/lgg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5813cf25cf02d0d3c834adf6770ff30e96bf11b4e6930570f61836259d9b2788 +size 561079103 diff --git a/full_models/lgg/G_100000.pth b/full_models/lgg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be7783d7336d54fe11c467bfa34be6aa54e9c7b5 --- /dev/null +++ b/full_models/lgg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6403c59582678f3afc51c6c957855e6a62f8e2c851b11029c705300548676bf2 +size 436372939 diff --git a/full_models/lgg/config.json b/full_models/lgg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lgg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lgg/vocab.txt b/full_models/lgg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..58e0a8e0af27b23e81e55b085132a5b902f25c97 --- /dev/null +++ b/full_models/lgg/vocab.txt @@ -0,0 +1,34 @@ +| +i +a +e +r +u +n +o +m +d +y +l +k +b +z +t +s +p +g +' +v +f +c +j +w +h +­ +- +0 +1 +5 +3 +q + diff --git a/full_models/lgl/D_100000.pth b/full_models/lgl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c66b674ce692f7f23f0ece772965ebd9739d4e01 --- /dev/null +++ b/full_models/lgl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7199e3c655b92104e89521b93b2a162dfb0025893ceb0d8d9baa998d9c781122 +size 561078715 diff --git a/full_models/lgl/G_100000.pth b/full_models/lgl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fad9cdcff8b48a7ce8d31234ade4d1c14e9567a8 --- /dev/null +++ b/full_models/lgl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:732069ea48b727bf6c8728bef7ed9ec28317ba9259f5a451240927034749cd2c +size 436368941 diff --git a/full_models/lgl/config.json b/full_models/lgl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lgl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lgl/vocab.txt b/full_models/lgl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2a588f2016b81465d9d5f6d65c7ee74947563e6c --- /dev/null +++ b/full_models/lgl/vocab.txt @@ -0,0 +1,34 @@ +2 +d +w +u +e +i +n +g +a +c +5 +_ +m +k +1 + +f +y +l +3 +p +s +r +o +0 +h +b +- +v +4 +j +' +ꞌ +t diff --git a/full_models/lhu/D_100000.pth b/full_models/lhu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e6f6a1bd0057b88431cc13d9cf9054f03b82d2ed --- /dev/null +++ b/full_models/lhu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dca9f63dac703d76b5eb3a429f35d468dee69ac927c9b1d130821265028247d +size 561078603 diff --git a/full_models/lhu/G_100000.pth b/full_models/lhu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a4967bb25188c26703073b3c1ee7572c3e55bd9 --- /dev/null +++ b/full_models/lhu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb9d009b9216bae3e5ba4273d98b0f62f804734bfae9bf263f7c1634a42ac21 +size 436364351 diff --git a/full_models/lhu/config.json b/full_models/lhu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lhu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lhu/vocab.txt b/full_models/lhu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0a5ccb9b5816435d1dc0195d5f53c00ebe0bf0c7 --- /dev/null +++ b/full_models/lhu/vocab.txt @@ -0,0 +1,32 @@ +| +a +h +e +ˬ +w +t +u +i +v +o +k +' +l +y +n +ˍ +p +c +g +m +ˆ +s +ˉ +d +b +- +j +r +f +z + diff --git a/full_models/lia/D_100000.pth b/full_models/lia/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4869efad89331774264dfef65e9ceb67a6fb4459 --- /dev/null +++ b/full_models/lia/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369d98f1b175de3245eb8fbe05ca03c7f747163cf5d81f84ea1d2292d1612fbb +size 561078708 diff --git a/full_models/lia/G_100000.pth b/full_models/lia/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..821e682761805df73c1a1d14d195fdf1b3b1e85d --- /dev/null +++ b/full_models/lia/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e135597e9cd56ea0013db6891d2ba28fadef8125761ffdf1090da436485080 +size 436355241 diff --git a/full_models/lia/config.json b/full_models/lia/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lia/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lia/vocab.txt b/full_models/lia/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..37a703c4efb2844520bb0373161e978946b216ce --- /dev/null +++ b/full_models/lia/vocab.txt @@ -0,0 +1,28 @@ +| +a +i +n +ŋ +k +b +ɛ +e +y +m +t +ɔ +h +u +o +d +w +s +l +r +p +g +f +- +— +' + diff --git a/full_models/lid/D_100000.pth b/full_models/lid/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c5c6ff093b37d1fef46023aabae5b946082f841 --- /dev/null +++ b/full_models/lid/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1188edefadd7732f339ef32ffc64314deed69aa6ee7f92e7442732d575e7d6c +size 561078456 diff --git a/full_models/lid/G_100000.pth b/full_models/lid/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f182781767eb3e3b4bb8d10d7b4764ea28ba3eb3 --- /dev/null +++ b/full_models/lid/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7326716138e794eeb1065f7030c9b81e74bbba7399effcb504e49d26a05ad37 +size 436371384 diff --git a/full_models/lid/config.json b/full_models/lid/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lid/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lid/vocab.txt b/full_models/lid/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1bde0e3062d30e1ff800583168a26db116581a36 --- /dev/null +++ b/full_models/lid/vocab.txt @@ -0,0 +1,35 @@ +y +1 +d +r +- +n +s +m +t +g +4 +b +9 +e +w +6 +_ + +5 +j +i +a +k +0 +3 +p +o +8 +' +7 +u +2 +h +– +l diff --git a/full_models/lif/D_100000.pth b/full_models/lif/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d7a1d7ba3e2f1df60d89729e3afd9166600f0419 --- /dev/null +++ b/full_models/lif/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bca0228f6037442e1b41f8f3f9ae863f3c99908d388b372900f7382e97485b2 +size 561076202 diff --git a/full_models/lif/G_100000.pth b/full_models/lif/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b658f762a01a5ac2e4e73f4f93f6c47297a6268 --- /dev/null +++ b/full_models/lif/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05df655b555c988261ceb628e318ceceb6ebc2a2cf8a6ac387021c08e168a523 +size 436388267 diff --git a/full_models/lif/config.json b/full_models/lif/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lif/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lif/vocab.txt b/full_models/lif/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d15f7a951f272a3995f40dc0fa1dbae64081c079 --- /dev/null +++ b/full_models/lif/vocab.txt @@ -0,0 +1,50 @@ +् +| +ा +े +़ +‍ +क +न +म +ङ +ि +ु +ल +ॽ +स +ः +ो +र +त +ब +प +ह +य +ख +आ +ग +व +द +इ +फ +थ +च +ज +ओ +छ +भ +ध +ए +घ +अ +उ +– +- +ै +' +ौ +­ +६ +— + diff --git a/full_models/lip/D_100000.pth b/full_models/lip/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..681bb3149fd04157c950949384d780d4f4c60825 --- /dev/null +++ b/full_models/lip/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7731253a0ebcb84d5fa82e6a1a5e37673b1ae34a86c739bcf310bd027339daab +size 561078986 diff --git a/full_models/lip/G_100000.pth b/full_models/lip/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1a98d2aad84e54ad90315bf258638337948b6121 --- /dev/null +++ b/full_models/lip/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc18d32a87668614c2b06779c939429d42f6dfb8608e2ac7ceb7f4307bd48b19 +size 436396138 diff --git a/full_models/lip/config.json b/full_models/lip/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lip/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lip/vocab.txt b/full_models/lip/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f3b4561b05bf065cc50bae6a2a290bada1fba50f --- /dev/null +++ b/full_models/lip/vocab.txt @@ -0,0 +1,44 @@ +| +ǝ +a +i +n +e +k +o +b +s +t +u +y +l +m +f +ɛ +ɔ +d +w +p +á +é +í +ó +ú +r +́ +ń +h +ã +g +v +̃ +- +ũ +z +ĩ +ḿ +à +ẽ +' +̀ + diff --git a/full_models/lis/D_100000.pth b/full_models/lis/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ece4315809eda38365c0c78ae116e88ea150e569 --- /dev/null +++ b/full_models/lis/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4a016337d0562a67eff816311ec455895c85665d9fbfef103d2a6dd9059700 +size 561078889 diff --git a/full_models/lis/G_100000.pth b/full_models/lis/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d7ff20df7eaa28fbb79de7dfb4a189247422ec61 --- /dev/null +++ b/full_models/lis/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a81089cbcef39b5c9f08e2d2924412f94518d2815da6bb68aea9cb3c84785dc +size 436421655 diff --git a/full_models/lis/config.json b/full_models/lis/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lis/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lis/vocab.txt b/full_models/lis/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a7f70ab9f53788e87d0cf0508a67e8703773b182 --- /dev/null +++ b/full_models/lis/vocab.txt @@ -0,0 +1,55 @@ +ꓤ +ꓖ +ꓡ +ꓺ +ꓣ +ꓶ +ꓢ +s +ꓥ +x +ꓙ +ꓕ +ꓛ +ꓫ +ꓳ +ꓪ +ꓵ +ꓱ +ˍ +ꓑ +ꓘ +ꓔ +ꓦ +ꓻ +ꓗ +ꓧ +ꓯ +ꓟ +ꓩ + +ꓲ +ꓹ +b +ꓐ +' +g +ꓒ +- +ꓝ +ꓼ +ꓬ +ꓽ +ꓷ +ꓴ +_ +ꓰ +ꓓ +ꓜ +ꓮ +ꓠ +w +ꓸ +ꓚ +ꓞ +z diff --git a/full_models/lje/D_100000.pth b/full_models/lje/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..39dcea67e95dd35706769b536e460aba84e2b7d3 --- /dev/null +++ b/full_models/lje/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fabce48afc385d53fc871eb3b5564c61e9f5f4bed9caab0d167ab391ea3a8664 +size 561078729 diff --git a/full_models/lje/G_100000.pth b/full_models/lje/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c2870f052787fd2ca659df64b9e1412460fd4bcf --- /dev/null +++ b/full_models/lje/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feb34389aa27ebdaca66e466f022cc9a90a0d7e394672df89459da6216de7b4c +size 436371260 diff --git a/full_models/lje/config.json b/full_models/lje/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lje/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lje/vocab.txt b/full_models/lje/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8e640afa85d0c0241fb76e118b7dd3480645826a --- /dev/null +++ b/full_models/lje/vocab.txt @@ -0,0 +1,35 @@ +b +j +t +g +5 +w +e +c +o +_ +7 +3 +n +p +h +u +4 +i +ꞌ +r +1 +d +l +2 +a +- +y +s +f +6 +k + +m +' +0 diff --git a/full_models/ljp/D_100000.pth b/full_models/ljp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..04a79461bc593e05a51f4a8dbac294abb765126a --- /dev/null +++ b/full_models/ljp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2353aaf50c65945193df1434faccc7acdf934ad889d54b36c25a2936fe98931 +size 561078847 diff --git a/full_models/ljp/G_100000.pth b/full_models/ljp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a2ab4bd02ece290e082c2d840bd21dc5e382f39 --- /dev/null +++ b/full_models/ljp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd802eb725c4bdec7dcbc8afc2ac483eb8514aec13e8a7e0947a39b5b78efabb +size 436373241 diff --git a/full_models/ljp/config.json b/full_models/ljp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ljp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ljp/vocab.txt b/full_models/ljp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbc9f501ba401042cd9c2addc1b1804fc55a4c38 --- /dev/null +++ b/full_models/ljp/vocab.txt @@ -0,0 +1,35 @@ +a +| +i +n +k +u +e +m +l +s +t +r +g +d +h +j +o +b +p +y +- +w +c +f +z +' +0 +v +4 +6 +1 +2 +3 +ë + diff --git a/full_models/llg/D_100000.pth b/full_models/llg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a8acdd51221e3f3dcc4f84ab6a02faae15de7a37 --- /dev/null +++ b/full_models/llg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e457e97ba99be3f9d3e97532dc4cee2360cb74829b4fb72fd5463b4ff908e07 +size 561076029 diff --git a/full_models/llg/G_100000.pth b/full_models/llg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7c55a230f076b2864517264bfba8fc0f59e3d79e --- /dev/null +++ b/full_models/llg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca97baefe5ea8da2ab7e226ba4c75007f9e04c902277dbe7ecfd513cefaf0622 +size 436331339 diff --git a/full_models/llg/config.json b/full_models/llg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/llg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/llg/vocab.txt b/full_models/llg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..04f2b870161d6be2f1045de395a53d190bb1677f --- /dev/null +++ b/full_models/llg/vocab.txt @@ -0,0 +1,26 @@ +l +- +b +i +g +n +a +_ +d +s +t + +o +c +k +y +m +f +e +' +x +r +h +p +w +u diff --git a/full_models/lln/D_100000.pth b/full_models/lln/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cffd0c4c4b3398bab6d138fc548811c4e75e6296 --- /dev/null +++ b/full_models/lln/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200fc0e8a8401b136e0c985b3614595c63604227d70cb93b50378629298ac869 +size 561078716 diff --git a/full_models/lln/G_100000.pth b/full_models/lln/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a9f49bb98ac9dca0111931310ca3366ef568de5 --- /dev/null +++ b/full_models/lln/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae45e9a9d799104cac3052a05a4f7a10c22c655ae5f1df1a59537c57ef615a48 +size 436375051 diff --git a/full_models/lln/config.json b/full_models/lln/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lln/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lln/vocab.txt b/full_models/lln/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1578868b9a1a30652347f7ef644acc7686087311 --- /dev/null +++ b/full_models/lln/vocab.txt @@ -0,0 +1,36 @@ +ỹ +' +l +p +r +s +i +g +h +u +á +í +ɓ +ú +- +j +w +̃ +t +m +b +ó +c +k + +_ +a +é +y +e +d +ɗ +ŋ +n +o +` diff --git a/full_models/lme/D_100000.pth b/full_models/lme/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87ae64a94d46552a1cb2d3ba43e87ea959c27977 --- /dev/null +++ b/full_models/lme/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c637c5cc40d8a77bae11661621415588e3b62106badbe35a8e5bd617d99b91 +size 561078609 diff --git a/full_models/lme/G_100000.pth b/full_models/lme/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e411c8873f28c36fcc1226b576bba7b6976d8f4 --- /dev/null +++ b/full_models/lme/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d477a9c6d6d507854a0e2aaf88c267cde06edd2e5434a61eb18be2fcb5f0e9c +size 436375981 diff --git a/full_models/lme/config.json b/full_models/lme/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lme/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lme/vocab.txt b/full_models/lme/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2777b682acd76a166ae4b57d6104a2d2a90ad2c7 --- /dev/null +++ b/full_models/lme/vocab.txt @@ -0,0 +1,37 @@ +| +a +ə +n +m +i +u +k +w +r +d +y +s +e +' +b +o +t +z +h +ɓ +g +c +f +â +ŋ +l +v +ɗ +ô +j +p +î +û +ê +- + diff --git a/full_models/lnd/D_100000.pth b/full_models/lnd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4421781e44e7f25987c6aa9f044b4be3255f7413 --- /dev/null +++ b/full_models/lnd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f4426d4ed2edcd2fc20c5241bedd8450de0fe1d0624a6b75c8854a8fd39d54 +size 561078848 diff --git a/full_models/lnd/G_100000.pth b/full_models/lnd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..059e6c58cd4f6986ec78f5f6642b2fca78b2308a --- /dev/null +++ b/full_models/lnd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9244a2262c00f97613570a22e198f0ed01131af689187574d0655427a189acd8 +size 436376586 diff --git a/full_models/lnd/config.json b/full_models/lnd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lnd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lnd/vocab.txt b/full_models/lnd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24eca94aeebbf949ca1c4d80d4a510b9b3d3e3fd --- /dev/null +++ b/full_models/lnd/vocab.txt @@ -0,0 +1,36 @@ +- +4 +r +k +v +c +e +t +b +2 +y +p +i +u +_ +' +1 +w +j +s +h +d + +5 +m +— +8 +é +0 +n +a +6 +7 +g +o +l diff --git a/full_models/lns/D_100000.pth b/full_models/lns/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1dd99dc6d3d26e84c8f271df5966e614a9029f8b --- /dev/null +++ b/full_models/lns/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555316b05994b03c725a81fb0ce26198963d4428f1319240e7503d1843902f7f +size 561079278 diff --git a/full_models/lns/G_100000.pth b/full_models/lns/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dce496011a34d89fce8ac19af728e406af930a85 --- /dev/null +++ b/full_models/lns/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa68795d6cb528646f0cc8d8d792a085d05d388204d74d706a44c549c13c4f7 +size 436405994 diff --git a/full_models/lns/config.json b/full_models/lns/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lns/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lns/vocab.txt b/full_models/lns/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..555e3ec03058a01d84ad036dd526e9dc3885b9b8 --- /dev/null +++ b/full_models/lns/vocab.txt @@ -0,0 +1,48 @@ +ó +u +y +ə +ǒ +k +b +ǔ +s +e +ŋ +l +̀ +ù +ú +n +c +ʼ +a +o +- +ǎ +ò +ì +z +m +̌ + +d +é +r +i +h +á +v +t +_ +í +è +g +à +ǐ +j +w +ě +́ +f +p diff --git a/full_models/lob/D_100000.pth b/full_models/lob/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a7f7a919a23cfc56e98d5b7a5f4ce38556dd65d2 --- /dev/null +++ b/full_models/lob/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4daa22791937aefb407d1f2e7d342bfeedd7e884ec970a7660d58431356df1 +size 561078582 diff --git a/full_models/lob/G_100000.pth b/full_models/lob/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4729d8e025dad19215b336d5cb65ebc1bd63079 --- /dev/null +++ b/full_models/lob/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7fbc2a03adb96a2faf0f85c248cfec1108be8be2a1beb7a62ca680744bca907 +size 436387382 diff --git a/full_models/lob/config.json b/full_models/lob/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lob/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lob/vocab.txt b/full_models/lob/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..58b0d84f3e6bfb3460a70f9c5dac3b81dd0e96ae --- /dev/null +++ b/full_models/lob/vocab.txt @@ -0,0 +1,42 @@ +| +a +ɩ +n +ɛ +r +ɔ +k +h +d +t +b +g +ʋ +l +o +i +s +e +̃ +p +m +ι +u +w +j +f +ã +- +y +c +' +ə +ƴ +ũ +ẽ +õ +ɓ +ĩ +v +ǝ + diff --git a/full_models/lok/D_100000.pth b/full_models/lok/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..15b716293fcea8b7afb1d343c8e974220a0d0200 --- /dev/null +++ b/full_models/lok/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a8eea8f7bf85f32706673c3ed62605c5edfdcbfd33f9de95e8f81be66e4bdb2 +size 561079007 diff --git a/full_models/lok/G_100000.pth b/full_models/lok/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..822b6ef0512d6f919bb87bafc3c0eab3db7fd1ac --- /dev/null +++ b/full_models/lok/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f19b33851cd67c9f6e8913a18460022d17d04e397d0d74ac4827b851c532619 +size 436361041 diff --git a/full_models/lok/config.json b/full_models/lok/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lok/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lok/vocab.txt b/full_models/lok/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3aa0db5682f85b15f94eb9ec5dc368e8b1c77891 --- /dev/null +++ b/full_models/lok/vocab.txt @@ -0,0 +1,29 @@ +w +e +a +ɔ +l +s +b +d +j +f +o +m +y +i +t +c +_ +n +k +' +g + +h +u +` +p +- +ɛ +q diff --git a/full_models/lom/D_100000.pth b/full_models/lom/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e3f64809e4a3b60f0e72ac0831d9adccc290308c --- /dev/null +++ b/full_models/lom/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a76c9ad13053baedfacddfd7f7b4f4d958e4abc4331312401fc623696b76a2 +size 561078601 diff --git a/full_models/lom/G_100000.pth b/full_models/lom/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d55f0295a3cf791296bfd1207efd1cb102d8f2e4 --- /dev/null +++ b/full_models/lom/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed02091f06e3e760416cb35633fd5ff70be302193dd26036f1b1329b628f5480 +size 436422072 diff --git a/full_models/lom/config.json b/full_models/lom/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lom/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lom/vocab.txt b/full_models/lom/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..489e5fb44ed53b00acee48f87987edd50d5ba823 --- /dev/null +++ b/full_models/lom/vocab.txt @@ -0,0 +1,57 @@ +| +a +i +ɛ +l +e +n +u +g +t +ɔ +o +w +z +ɣ +m +v +k +‐ +é +s +d +y +p +ƃ +ʋ +b +f +ŋ +è +á +à +̀ +́ +ũ +̃ +õ +í +ã +ì +j +ú +h +ù +ẽ +ĩ +ó +ò +ẁ +— +' +ẃ +ɓ +c +ê +- + diff --git a/full_models/lon/D_100000.pth b/full_models/lon/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..abb049c4c0c3272110125dfba80429b6347ab2ad --- /dev/null +++ b/full_models/lon/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8cfde6a7178280b83517932d194f98f85baa8b0b031d4a125fde44f0777e06 +size 561079130 diff --git a/full_models/lon/G_100000.pth b/full_models/lon/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..45370b420b23886c096fbae46ed41e1b421773aa --- /dev/null +++ b/full_models/lon/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20995c4f8d038a38752188c2e9e9eeb85c3385a318191a28ff064bce301c2f00 +size 436380552 diff --git a/full_models/lon/config.json b/full_models/lon/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lon/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lon/vocab.txt b/full_models/lon/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..61d03572d0b9d0037f9e5b42f1d658c6b7b349d7 --- /dev/null +++ b/full_models/lon/vocab.txt @@ -0,0 +1,37 @@ +2 +o +w +8 +0 +7 +s +' +6 +y +v +b +_ +4 +c +n +r +u +i +3 +9 +z +h +g +f +j +l + +a +m +e +d +p +1 +5 +t +k diff --git a/full_models/loq/D_100000.pth b/full_models/loq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fbab164d3ba65c25afc591adcfdbc7e7be3f9f51 --- /dev/null +++ b/full_models/loq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3697af2f9a3117e667ddf46d4eafbdd94e12825e67bdda3eb2a5d4a999b0d363 +size 561076208 diff --git a/full_models/loq/G_100000.pth b/full_models/loq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f9b58eacdde7514750d35bbf520cbdf2bb2103d7 --- /dev/null +++ b/full_models/loq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171da2f1d3f44e818be8dcb634ee15c49200f454af3644fce038e64a88c916c0 +size 436353603 diff --git a/full_models/loq/config.json b/full_models/loq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/loq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/loq/vocab.txt b/full_models/loq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..948add0ae54f3bd4fd5289d5c2e613224da81445 --- /dev/null +++ b/full_models/loq/vocab.txt @@ -0,0 +1,35 @@ +v +f +w + +ɔ +i +ŋ +a +́ +g +b +̣ +e +p +' +_ +t +̀ +k +d +h +é +r +y +ɛ +n +m +s +z +- +l +u +o +ɓ +ó diff --git a/full_models/lsi/D_100000.pth b/full_models/lsi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92598ac49f97e3a8254b0620f775dabc31268508 --- /dev/null +++ b/full_models/lsi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f99114ee396466dbe6b7001a198d3866f40971161e9a0dda71aa7d2020cf0e +size 561078611 diff --git a/full_models/lsi/G_100000.pth b/full_models/lsi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a71a0fd2c2daeb2940f40af8d8d435aa9032fa50 --- /dev/null +++ b/full_models/lsi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf4406eff2d02d76c2eeb3a0acacfee9af6ff92263269cbffc6a67499e343f8 +size 436380504 diff --git a/full_models/lsi/config.json b/full_models/lsi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lsi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lsi/vocab.txt b/full_models/lsi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6cd859d4a231a243aabd3fffb83b0a4c29175b28 --- /dev/null +++ b/full_models/lsi/vocab.txt @@ -0,0 +1,39 @@ +l +7 +f +- +q +p + +y +h +e +0 +6 +k +3 +x +a +n +5 +i +w +1 +u +j +_ +2 +g +o +' +z +c +s +` +b +d +4 +v +t +m +r diff --git a/full_models/lsm/D_100000.pth b/full_models/lsm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af9e358fa977d10da6f1624a5342bd862244b1c1 --- /dev/null +++ b/full_models/lsm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79ffbaa8da2bd836c45d38acc791eca58b20cd6f31524bae79b21825c84a5ac +size 561078847 diff --git a/full_models/lsm/G_100000.pth b/full_models/lsm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6acab95e1ce0999911f7b1944e15758cbf517862 --- /dev/null +++ b/full_models/lsm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7550dc0571075486d04c4c4f7aec57b46699a47cca20dd8774fd547c0b7c75a +size 436371124 diff --git a/full_models/lsm/config.json b/full_models/lsm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lsm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lsm/vocab.txt b/full_models/lsm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f78020670ee589c8450c47bed1ad4c3bd9bdf4e8 --- /dev/null +++ b/full_models/lsm/vocab.txt @@ -0,0 +1,33 @@ +a +| +i +e +o +n +u +b +h +l +m +y +s +w +r +d +k +t +g +c +' +f +j +- +p +0 +1 +2 +4 +5 +3 +q + diff --git a/full_models/luc/D_100000.pth b/full_models/luc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb9705a0898f262b410b52d35a3a2da5ac92e852 --- /dev/null +++ b/full_models/luc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f16e85f7de60967c3a731630662dbd7e63f34c773fed7115aacd7752c569761 +size 561079009 diff --git a/full_models/luc/G_100000.pth b/full_models/luc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c337a3fa34c0d2aba2e0e194925217e486d883d8 --- /dev/null +++ b/full_models/luc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5821613b50468157407b3a1dd841d0ea940656d82715cefcec6f2e4479d5af6 +size 436429438 diff --git a/full_models/luc/config.json b/full_models/luc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/luc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/luc/vocab.txt b/full_models/luc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5e32a616b34380ce55a459794a71c1552215a571 --- /dev/null +++ b/full_models/luc/vocab.txt @@ -0,0 +1,59 @@ +6 +n +e +ã +a +ô +' +s +ê +p +î +3 +â +i +ộ +_ +- +í +́ + +2 +4 +á +ó +ŋ +ĩ +ụ +o +v +h +ọ +õ +l +ị +u +ẽ +w +ẹ +ệ +y +t +f +û +m +0 +j +ú +k +z +c +d +é +ũ +1 +̂ +g +b +r +̃ diff --git a/full_models/lug/D_100000.pth b/full_models/lug/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..386012ce33cc18f8ba6eb27e05facc4af79d8842 --- /dev/null +++ b/full_models/lug/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5450f642ad2ae1f48a20b7747638955183c03f67cbd5cb24809afa5d0f14238a +size 561110385 diff --git a/full_models/lug/G_100000.pth b/full_models/lug/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..afa60849183322d589f0a917ef031728dc7b984c --- /dev/null +++ b/full_models/lug/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5206f861527482b570693af3eff1ee61050f48ca9375bf0ac22dfb21e30452df +size 436600451 diff --git a/full_models/lug/config.json b/full_models/lug/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lug/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lug/vocab.txt b/full_models/lug/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..3e8ec68774d849384a39939d61e41844f1154450 --- /dev/null +++ b/full_models/lug/vocab.txt @@ -0,0 +1,30 @@ +z +e +d +f +p +c +4 +j +s +g +r +- +n +w +a +b +k +y +_ +t +o +ŋ + +' +l +h +v +i +u +m diff --git a/full_models/lwo/D_100000.pth b/full_models/lwo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f592f3db573a4569e37c97421e20409ba679640 --- /dev/null +++ b/full_models/lwo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19bc7e627b0c93c12aa31ad8daba4fc1d1888956214a56811b645ed695f5c63e +size 561078716 diff --git a/full_models/lwo/G_100000.pth b/full_models/lwo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff1b8983762b4cf3fc61b938816836154c6336a1 --- /dev/null +++ b/full_models/lwo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19359d7329472291b9806f3208d3faa545e5966f54213b3e78b76d5a2dc96807 +size 436355283 diff --git a/full_models/lwo/config.json b/full_models/lwo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lwo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lwo/vocab.txt b/full_models/lwo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..118bdd613e137a72c7c48a958fdd1e387816ed38 --- /dev/null +++ b/full_models/lwo/vocab.txt @@ -0,0 +1,28 @@ +| +a +e +n +h +o +g +i +u +y +d +k +r +m +w +b +j +c +t +l +p +' +q +0 +s +1 +5 + diff --git a/full_models/lww/D_100000.pth b/full_models/lww/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9431599dd9a96b32d0b133494caedd05d67f0f96 --- /dev/null +++ b/full_models/lww/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70c174fa32d46724829a33f048d07f847ad81b271c4ff888ad3d185e231e8c92 +size 561076204 diff --git a/full_models/lww/G_100000.pth b/full_models/lww/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e70e2893f053bd9b292f91920baaf9513a978aa2 --- /dev/null +++ b/full_models/lww/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14e5f7cfe6a4145b676992aa75e1e82b5c3ef51a41f7785f6b6dfd6cbace51d9 +size 436348989 diff --git a/full_models/lww/config.json b/full_models/lww/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lww/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lww/vocab.txt b/full_models/lww/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d9e6cae0bae1851e54cc812f08df173efc5b86fb --- /dev/null +++ b/full_models/lww/vocab.txt @@ -0,0 +1,33 @@ +8 +4 +g +a +y +k +x +2 +w +- +̃ +1 +s +0 +i +3 +r +n +v +' + +_ +o +6 +e +7 +5 +p +l +u +m +t +9 diff --git a/full_models/lzz/D_100000.pth b/full_models/lzz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..601ae4521f2e8dd3a167edce6de6dcb5e7cd6ab9 --- /dev/null +++ b/full_models/lzz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27ea97bc16d9b7fdc0539b715e36c8e1fcf9ecff9a81c9255d82bb40f0b8b4b +size 561076073 diff --git a/full_models/lzz/G_100000.pth b/full_models/lzz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..627ade52bfb85c62a027afbd52f3244d1dbd15e3 --- /dev/null +++ b/full_models/lzz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ce0b773526b54d450aef502d4195cb77a98b7ae552d9545e8bf45a291bf0ee +size 436350500 diff --git a/full_models/lzz/config.json b/full_models/lzz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/lzz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/lzz/vocab.txt b/full_models/lzz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..008799599bae4bfcf8090ac1f95a4c3982ab620d --- /dev/null +++ b/full_models/lzz/vocab.txt @@ -0,0 +1,34 @@ +d +n +ğ +k +̇ +' +ş +ç +z +̆ +b +a +y +_ +s +m +e +x +u +o +f +i +p +t +h +r +c +g +j +v +l + +ʒ +- diff --git a/full_models/maa-dialect_sanantonio/D_100000.pth b/full_models/maa-dialect_sanantonio/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..85c773a4c28d8d6cf1f5dcd42e958569d6a44c21 --- /dev/null +++ b/full_models/maa-dialect_sanantonio/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c02166403667a9045c4753d6489388d923f820ab268b2e5a9e120dca3f9e8a +size 561076191 diff --git a/full_models/maa-dialect_sanantonio/G_100000.pth b/full_models/maa-dialect_sanantonio/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e8ee56949e757ddd7cbaf9a44a0f624509498847 --- /dev/null +++ b/full_models/maa-dialect_sanantonio/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740eb90f803a55f9ba11987ad571591b80747739add566025db52f11a106b51d +size 436369736 diff --git a/full_models/maa-dialect_sanantonio/config.json b/full_models/maa-dialect_sanantonio/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/maa-dialect_sanantonio/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/maa-dialect_sanantonio/vocab.txt b/full_models/maa-dialect_sanantonio/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cec86094b5809d394975c3062fb83f30f1453eb7 --- /dev/null +++ b/full_models/maa-dialect_sanantonio/vocab.txt @@ -0,0 +1,42 @@ +| +a +n +̱ +i +j +t +k +s +o +' +‐ +í +á +g +r +e +l +m +ì +x +h +c +d +y +é +ò +è +à +ñ +ó +b +u +f +ú +p +- +v +z +q +ù + diff --git "a/full_models/maa-dialect_sanjer\303\263nimo/D_100000.pth" "b/full_models/maa-dialect_sanjer\303\263nimo/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..b6943bd7ac2befba3ace7ceb3b2213f6aeff5db9 --- /dev/null +++ "b/full_models/maa-dialect_sanjer\303\263nimo/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1f785d27b2b70be92c69537efe89c63dcbfd6b8003172120585431a5adfdaf +size 561078373 diff --git "a/full_models/maa-dialect_sanjer\303\263nimo/G_100000.pth" "b/full_models/maa-dialect_sanjer\303\263nimo/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..ba69a664dcf05556e66246ecd19975cbd60d1741 --- /dev/null +++ "b/full_models/maa-dialect_sanjer\303\263nimo/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9728b97b55a3ea81fffc4f9185024fbcf32070638237ec3b20edd62c6e077e9 +size 436385090 diff --git "a/full_models/maa-dialect_sanjer\303\263nimo/config.json" "b/full_models/maa-dialect_sanjer\303\263nimo/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/maa-dialect_sanjer\303\263nimo/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/maa-dialect_sanjer\303\263nimo/vocab.txt" "b/full_models/maa-dialect_sanjer\303\263nimo/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..b4b68d48ce61253c17ac450850b154a1ccd4cf10 --- /dev/null +++ "b/full_models/maa-dialect_sanjer\303\263nimo/vocab.txt" @@ -0,0 +1,41 @@ +| +a +n +̱ +i +j +k +t +o +s +' +‐ +e +x +g +í +ì +á +à +l +ò +m +h +c +d +è +y +é +ñ +r +ó +b +u +ú +f +p +z +v +q +- + diff --git a/full_models/mad/D_100000.pth b/full_models/mad/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..beec3fa31294b63d927bc2be2948ad5b4aa5f4ed --- /dev/null +++ b/full_models/mad/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b2b2f87d02494ac2887b07bf95284ff5a223a5b743fc9a6a685b6f2572720a +size 561078599 diff --git a/full_models/mad/G_100000.pth b/full_models/mad/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ea4e7993ab5d23c61d5533ea41cf02abd2669b07 --- /dev/null +++ b/full_models/mad/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2e9c7f57320c0d16739e73904136ebb27969eb8815f69fde49267a85eb89b6 +size 436369186 diff --git a/full_models/mad/config.json b/full_models/mad/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mad/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mad/vocab.txt b/full_models/mad/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..af7e7ebaf4bdde0c0bf79d8caae99e66bfe2904a --- /dev/null +++ b/full_models/mad/vocab.txt @@ -0,0 +1,34 @@ +a +| +n +e +s +g +r +o +k +l +b +d +t +p +i +m +' +h +u +y +j +- +c +w +f +z +â +– +ä +0 +3 +ë +2 + diff --git a/full_models/mag/D_100000.pth b/full_models/mag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0aaab2735b9d9da3754a1923d1f5ebd213f58b34 --- /dev/null +++ b/full_models/mag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690e426aa9ab0109c00685bbf0de91c6e27c29f4d37506567c0b4f88393a286d +size 561078980 diff --git a/full_models/mag/G_100000.pth b/full_models/mag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5888108ed63eb090d0d40d3ad79bef328f38c0c1 --- /dev/null +++ b/full_models/mag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6686abb36980c8e227a2344a4f24ce213787b899c9280e347a0220a79e183c0 +size 436454086 diff --git a/full_models/mag/config.json b/full_models/mag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mag/vocab.txt b/full_models/mag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f9c819b32ffbc9d7fc1a0fea288887d96ecdbc40 --- /dev/null +++ b/full_models/mag/vocab.txt @@ -0,0 +1,69 @@ +आ +े +ड +ञ +– +स +म +च +प +ब +ी +घ +ँ +औ +ॅ +ट +ख +छ +ण +ि +ऽ +ʻ +2 +् +भ +र +़ +ल +ै +ह +ओ +ं +झ +द +ʼ +_ +ो +ऐ +ढ +ज +अ +è +‍ +ा +व +उ +ु +ष +ऩ +à +ध +ग +त +क +ौ +ई +ए +ठ +य +न +श +ऱ +ऊ +ू +फ +इ +- + +थ diff --git a/full_models/mah/D_100000.pth b/full_models/mah/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81fafb1bc87888a2b0d5674d25a84357fec2cb9c --- /dev/null +++ b/full_models/mah/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cd1971b5359c9d05d010df70d4f4c270f6f7d12869a26e4a199dfb3f382fa50 +size 561078985 diff --git a/full_models/mah/G_100000.pth b/full_models/mah/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aefda79934887fff04da12edc6f65ee5eb8e97e7 --- /dev/null +++ b/full_models/mah/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd29847050f9d0a7a0a8fc0bd6b3d2b746a3a5d5bfa7df4883cbbaea8919735c +size 436381506 diff --git a/full_models/mah/config.json b/full_models/mah/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mah/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mah/vocab.txt b/full_models/mah/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..527e6b9fbabb2f49608655ad54ecc730ed459639 --- /dev/null +++ b/full_models/mah/vocab.txt @@ -0,0 +1,38 @@ +| +e +a +i +n +k +j +o +r +m +ō +l +t +w +b +ṃ +ñ +ā +p +ḷ +u +ọ +d +s +ṇ +ū +y +g +v +z +h +f +' +- +x +c +q + diff --git a/full_models/mai/D_100000.pth b/full_models/mai/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c0b1da5869e4f4a3a9174303a21a31680766ccae --- /dev/null +++ b/full_models/mai/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c18cd2ec6e0a3f2ef2101e7122cf067af0fb5bd554f4e9493ebec048e9003fb +size 561079213 diff --git a/full_models/mai/G_100000.pth b/full_models/mai/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..502f74b5372ee5bc0f51b53c5dbbcfeca2b43665 --- /dev/null +++ b/full_models/mai/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9659877802e061566258f9a0f5b20b450b9fbb68997dcde4f8a0bd28e5f659e +size 436448299 diff --git a/full_models/mai/config.json b/full_models/mai/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mai/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mai/vocab.txt b/full_models/mai/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3e4cf7214b4e631e9b2686ca6de56a55e44b9c1f --- /dev/null +++ b/full_models/mai/vocab.txt @@ -0,0 +1,66 @@ +| +ा +क +र +ि +ह +े +स +न +् +त +ल +म +प +ँ +‍ +भ +ज +ु +अ +य +ब +ी +द +व +छ +ो +श +ग +आ +ओ +ै +ऽ +ू +ख +थ +ए +च +ध +ट +ष +- +ड +़ +ण +इ +ं +उ +औ +ई +ौ +ठ +फ +ृ +घ +ढ +झ +ञ +— +ऊ +ऐ +ः +' +ङ +ऋ + diff --git a/full_models/maj/D_100000.pth b/full_models/maj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a384787c687e5605e6f649e2fbed95a84e7791da --- /dev/null +++ b/full_models/maj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a4f3e4e4a7ef647064574ab40890212fdfab2f3824298fde171ce91785b2e0 +size 561078581 diff --git a/full_models/maj/G_100000.pth b/full_models/maj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7fd3de3a7369957e22e0dfacc0eab1ea3ea56281 --- /dev/null +++ b/full_models/maj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43bf334460af2ebc118ea349b7031b10875ad92afb9c3f1c54a15ee8ec0afa2 +size 436373692 diff --git a/full_models/maj/config.json b/full_models/maj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/maj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/maj/vocab.txt b/full_models/maj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2b09dee6e2d47c116fe68dac3ca4716f937d0333 --- /dev/null +++ b/full_models/maj/vocab.txt @@ -0,0 +1,36 @@ + +u +m +r +p +s +o +v +l +— +y +j +h +g +ú +n +i +e +' +a +k +x +z +c +_ +d +í +á +f +ó +é +̱ +ṉ +t +ñ +b diff --git a/full_models/mak/D_100000.pth b/full_models/mak/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7683937eb35e99d68e6451ccff25a72f64c4990 --- /dev/null +++ b/full_models/mak/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421098ade5fef5cdabe532abd823cee0bef15d49ea5e8884518aa49e942b3296 +size 561078619 diff --git a/full_models/mak/G_100000.pth b/full_models/mak/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7fed6a5b8855f0092dba1081e42996486524ce0 --- /dev/null +++ b/full_models/mak/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf521af63efa97ee7772013b33b9aaf71cc54d5f5b6319456950928d5296b03 +size 436362072 diff --git a/full_models/mak/config.json b/full_models/mak/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mak/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mak/vocab.txt b/full_models/mak/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..79f6ee1ab2c0ff959b2c924fe6451fcf858659ec --- /dev/null +++ b/full_models/mak/vocab.txt @@ -0,0 +1,31 @@ +a +| +n +i +g +k +m +l +t +u +e +r +s +' +o +p +b +j +y +- +d +c +h +w +f +z +0 +4 +1 +2 + diff --git a/full_models/mal/D_100000.pth b/full_models/mal/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..630ffe1aa8165d2cd706f480629e57f228e266a1 --- /dev/null +++ b/full_models/mal/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8753cf464b97a369acf148453e498959aa8d09ff958720fe1484eda22fb898 +size 561110626 diff --git a/full_models/mal/G_100000.pth b/full_models/mal/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..209298481b80b5cc123d6c9d649a618ce5ea141c --- /dev/null +++ b/full_models/mal/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94043650c6010e925e5d2361e49637c991000cd789982af02a9fb30002ef9f4e +size 436724906 diff --git a/full_models/mal/config.json b/full_models/mal/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mal/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mal/vocab.txt b/full_models/mal/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..01c840400688a5696f66e6de0458f3798d001e96 --- /dev/null +++ b/full_models/mal/vocab.txt @@ -0,0 +1,84 @@ +— +ത +ര +ള +ഴ +ഒ +0 +ൂ +ഖ +ഞ +ഇ +ഡ +ി +ഊ +ച +ാ +യ +ഷ +i +ഉ +ഫ +ല +ഠ +4 +െ +ൗ +ആ +സ +ു +ം +m +ജ +ധ +- +ഹ +ഛ +് +ട +ഃ +ഗ +ണ +ൽ +ോ +_ +റ +ഏ +6 +എ +ർ +ഥ +ഘ +ഓ +ീ +ൈ +2 +േ +ക +1 +ൾ +ങ +ഭ + +ഢ +അ +മ +ബ +3 +ഈ +ഔ +പ +ൺ +ന +ൊ +o +ൃ +c +വ +ൻ +ദ +5 +ഐ +' +q +ശ diff --git a/full_models/mam-dialect_central/D_100000.pth b/full_models/mam-dialect_central/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b5a52610ae05adc2421f81ea74373e22cd15a6b --- /dev/null +++ b/full_models/mam-dialect_central/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a58201ccbe3d9eba1d2887a731a0d53d31b23f97c0952985d4c46049c590128 +size 561077830 diff --git a/full_models/mam-dialect_central/G_100000.pth b/full_models/mam-dialect_central/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..483938685b960eb0eced6ac01e34bd73f0affa40 --- /dev/null +++ b/full_models/mam-dialect_central/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904f323dfbf3dcb7a4a9c1c487fec1bf0b77b41ac225a7807fc46f184ca7f11d +size 436383100 diff --git a/full_models/mam-dialect_central/config.json b/full_models/mam-dialect_central/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mam-dialect_central/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mam-dialect_central/vocab.txt b/full_models/mam-dialect_central/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..45961075f7d4ad8a17963dfd050ec4b333b0b3bd --- /dev/null +++ b/full_models/mam-dialect_central/vocab.txt @@ -0,0 +1,44 @@ +| +t +' +i +n +a +j +e +k +l +y +u +o +x +q +b +m +z +w +s +c +h +p +d +r +- +ú +g +ẍ +é +í +f +v +á +ó +0 +6 +4 +1 +5 +2 +3 +ñ + diff --git a/full_models/mam-dialect_northern/D_100000.pth b/full_models/mam-dialect_northern/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a5cb6a7d7769b4f5fffdcfcb953f38a0361caf06 --- /dev/null +++ b/full_models/mam-dialect_northern/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfac802e79b4bb941b1fc42e7da534e0d8e4005753682c5e5fbf4e18ecc029c +size 561077719 diff --git a/full_models/mam-dialect_northern/G_100000.pth b/full_models/mam-dialect_northern/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa3c51bc0852617f99982afa939a8e18a3cf22e8 --- /dev/null +++ b/full_models/mam-dialect_northern/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d31c4c087d134a7e575a338d0bfcbe1aab5f6287bacf9fff2451bf1c2bb6ef +size 436392595 diff --git a/full_models/mam-dialect_northern/config.json b/full_models/mam-dialect_northern/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mam-dialect_northern/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mam-dialect_northern/vocab.txt b/full_models/mam-dialect_northern/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..375bfc9eadf099d23c9793b318d69339c55121cf --- /dev/null +++ b/full_models/mam-dialect_northern/vocab.txt @@ -0,0 +1,48 @@ +| +t +a +n +e +i +ꞌ +c +j +u +l +y +x +o +k +m +b +z +s +w +p +h +r +d +q +- +ú +— +g +ẍ +é +ó +v +í +á +f +ñ +0 +4 +2 +3 +9 +5 +6 +7 +8 +1 + diff --git a/full_models/mam-dialect_southern/D_100000.pth b/full_models/mam-dialect_southern/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f1c22df487a31d9f45e772e752e20c1818a434e --- /dev/null +++ b/full_models/mam-dialect_southern/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93de8eee15e85045cc8eb592ccd0a749890563787d28465a38c00cbb4decd3ee +size 561078120 diff --git a/full_models/mam-dialect_southern/G_100000.pth b/full_models/mam-dialect_southern/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..04b383d85aa6dc1cbfe7e8d9f7793867d5e34bb1 --- /dev/null +++ b/full_models/mam-dialect_southern/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00ae3931cb96d9dcb7590e09235be5b18ba025e9d37b249580cac6da5aa5f31 +size 436359981 diff --git a/full_models/mam-dialect_southern/config.json b/full_models/mam-dialect_southern/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mam-dialect_southern/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mam-dialect_southern/vocab.txt b/full_models/mam-dialect_southern/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3c76217841f35d86482c4e35a02d1e29117a3fc2 --- /dev/null +++ b/full_models/mam-dialect_southern/vocab.txt @@ -0,0 +1,32 @@ +| +' +t +a +n +e +i +j +u +k +l +x +y +o +q +b +m +z +s +w +c +h +p +d +r +- +— +ẍ +g +ú +́ + diff --git a/full_models/mam-dialect_western/D_100000.pth b/full_models/mam-dialect_western/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8186082e95307684e6b806514c57dd4db8cef8a8 --- /dev/null +++ b/full_models/mam-dialect_western/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab340002cce628cef2f705aed2d87722cef0b06e32c20fe8c44bc5787a5c1d9 +size 561077947 diff --git a/full_models/mam-dialect_western/G_100000.pth b/full_models/mam-dialect_western/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd348454ea154ff0f975c7209883c4f91d069473 --- /dev/null +++ b/full_models/mam-dialect_western/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5869a5abbc3b9890ef566af6fe4e80cdd4f66c53f4f4e24724cff12865b7f06 +size 436372804 diff --git a/full_models/mam-dialect_western/config.json b/full_models/mam-dialect_western/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mam-dialect_western/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mam-dialect_western/vocab.txt b/full_models/mam-dialect_western/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6d6cdea952763424c91accbfb227d817aa182c6f --- /dev/null +++ b/full_models/mam-dialect_western/vocab.txt @@ -0,0 +1,39 @@ +| +t +a +n +i +e +' +j +c +l +x +y +u +o +k +b +s +z +m +w +p +d +r +h +- +̈ +ú +q +— +í +g +é +á +ẍ +ó +f +v +ñ + diff --git a/full_models/maq/D_100000.pth b/full_models/maq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9124c02292ad5500bd53354b3def59697b53043a --- /dev/null +++ b/full_models/maq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80f17d4403bfa5f51661fd995e9771698fae77a7dcab001abe0a07b7bc25c662 +size 561076148 diff --git a/full_models/maq/G_100000.pth b/full_models/maq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..750ba42ce1dbbfa7c6e312badf057717fc75d5fc --- /dev/null +++ b/full_models/maq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1cc51901994723662449e18c2ca13397b5cba580c823291dfdb4c8407ac4b7 +size 436352602 diff --git a/full_models/maq/config.json b/full_models/maq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/maq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/maq/vocab.txt b/full_models/maq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c517e573f567ad4bd522d9d7215f09eabb7ce830 --- /dev/null +++ b/full_models/maq/vocab.txt @@ -0,0 +1,35 @@ +d +_ +í +v +t +b +h +g +y +́ +z +ó +l + +p +n +s +é +ú +o +e +m +a +u +ñ +i +c +á +x +ë +r +j +‍ +q +f diff --git a/full_models/mar/D_100000.pth b/full_models/mar/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee76ed76b5bb0e24c7d0b2e2a748342ae34cde6e --- /dev/null +++ b/full_models/mar/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a46d539626f4f406696f06c40eae0d903ef215662b285f1fde01fd0d61d4b4ae +size 561110146 diff --git a/full_models/mar/G_100000.pth b/full_models/mar/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..07c8700036a5363b75b66290f40a7451d8b8733d --- /dev/null +++ b/full_models/mar/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db72854bed82dfb13589f9b37cc2ce2a9dc257e8b9f22dcbe73dd3e2445deb48 +size 436699461 diff --git a/full_models/mar/config.json b/full_models/mar/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mar/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mar/vocab.txt b/full_models/mar/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..bc36bbec8bce5faf235e5fdfbcadc0a24c81fda6 --- /dev/null +++ b/full_models/mar/vocab.txt @@ -0,0 +1,73 @@ +ङ +ह +आ +ब +ढ +ख +2 +ं +त +ट +_ +स +ऊ +1 +क +औ +ळ +च +ओ +- +ई +श +ज +ृ +ग +झ +ʈ +ऐ +द + +ड +ए +ै +ौ +9 +7 +ठ +ऱ +व +ो +ऋ +0 +4 +य +6 +ः +ल +ध +प +ञ +फ +उ +न +ष +म +छ +े +ि +ण +' +अ +इ +ा +ु +ू +ʇ +ऴ +घ +् +र +भ +ी +थ diff --git a/full_models/maw/D_100000.pth b/full_models/maw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b36a129bdc515e2822670a344de31960054bac27 --- /dev/null +++ b/full_models/maw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5882198274e16d35c92286e8613130a75c4baec6ee85ce3d0d50f2331e8cf1d8 +size 561078705 diff --git a/full_models/maw/G_100000.pth b/full_models/maw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be7fa855189ee629938c64f80145d783358e0ea8 --- /dev/null +++ b/full_models/maw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc57e8c5061586428b5022742854cc8b31813ecaf30ce166f3ce773ae7a6726b +size 436359850 diff --git a/full_models/maw/config.json b/full_models/maw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/maw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/maw/vocab.txt b/full_models/maw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77a87432389d17060ed28dcd2c59314c3fde7a04 --- /dev/null +++ b/full_models/maw/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +n +u +m +y +b +s +l +k +d +ŋ +t +r +e +ↄ +ɛ +g +- +o +z +p +w +' +h +f +v +ԑ + diff --git a/full_models/maz/D_100000.pth b/full_models/maz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1778cd517c135b9c604edbfe598c999c52b0e367 --- /dev/null +++ b/full_models/maz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:febdead6e410a906459207539cf24bc93cb984bb6933f7b11d113d4ef5402d6d +size 561078601 diff --git a/full_models/maz/G_100000.pth b/full_models/maz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cc0dff48161c88b21d384ed43e64d77b7a135965 --- /dev/null +++ b/full_models/maz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6b171011398db3002cc9eebb6adf99afd1a4fb383e1c46dd91578d3a6f6eb1 +size 436394331 diff --git a/full_models/maz/config.json b/full_models/maz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/maz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/maz/vocab.txt b/full_models/maz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5ab97ab520e90ac11c07cedaba015f7c3cf6de2c --- /dev/null +++ b/full_models/maz/vocab.txt @@ -0,0 +1,45 @@ +| +a +j +i +e +c +' +o +n +m +u +r +ü +t +s +g +d +y +p +z +ö +b +x +h +ñ +í +̱ +ä +ë +v +ã +l +á +ũ +ó +ṉ +õ +ẽ +ú +f +q +é +ĩ +k + diff --git a/full_models/mbb/D_100000.pth b/full_models/mbb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20f40ce27f187cba6105088b7df2bc9c3f3dac1a --- /dev/null +++ b/full_models/mbb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05eb64e16929e6ea336aafd43583004b48dc9f2eaade45b71629df62952d620c +size 561077872 diff --git a/full_models/mbb/G_100000.pth b/full_models/mbb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ac9abe199f9a458f1e85181c1b9b6ef64777b3e --- /dev/null +++ b/full_models/mbb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec40fe8555ab3854f7223832c4b03f5d57848745bb812f65290618dcbf134e1 +size 436371269 diff --git a/full_models/mbb/config.json b/full_models/mbb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbb/vocab.txt b/full_models/mbb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..04ea46b0e8fcbc626ea1d83f83ecc9963bbfc3f3 --- /dev/null +++ b/full_models/mbb/vocab.txt @@ -0,0 +1,35 @@ +| +e +n +a +i +u +t +k +s +m +d +h +g +y +l +w +z +p +b +à +v +ǥ +r +- +è +ù +j +ì +o +' +c +f +x +7 + diff --git a/full_models/mbc/D_100000.pth b/full_models/mbc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..080cf898abb6ba779bef38ed00e27b8f8fd69671 --- /dev/null +++ b/full_models/mbc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b50261f7433037fd1bae8e2df52bcdb53d5e3d9375401307c389929b171fca +size 561078511 diff --git a/full_models/mbc/G_100000.pth b/full_models/mbc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..26b5f6c0d6e90e148e696757c7ac6d79aaa38fb6 --- /dev/null +++ b/full_models/mbc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d9ea8baaa147289ee7e1ffc0cf2869dea7c1f68b0beed18851a120d0d2b516 +size 436414888 diff --git a/full_models/mbc/config.json b/full_models/mbc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbc/vocab.txt b/full_models/mbc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..adb93602fef667f6d449db7f808a7193a486477e --- /dev/null +++ b/full_models/mbc/vocab.txt @@ -0,0 +1,54 @@ +- +k +é +0 +w +h +9 +y +ê +j +z +i +v +â +l +b +p +m +s +í +3 +˼ +5 +_ +t +d +g +c +ô +— +õ +1 +6 +' +n +á +2 + +r +x +a +u +ã +˻ +î +7 +ó +8 +e +4 +f +q +ú +o diff --git a/full_models/mbh/D_100000.pth b/full_models/mbh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0fdcd063a3d9bb237eb70a18e6c0be4673110b87 --- /dev/null +++ b/full_models/mbh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6555a3103b4451f700262fb8b51ad352a46ceab6d31902a06501f2b4bbe264 +size 561078753 diff --git a/full_models/mbh/G_100000.pth b/full_models/mbh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9637752a6df5ac46d1cfb63ddd795bfa22df1f96 --- /dev/null +++ b/full_models/mbh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183cfb2ff7b84680bf8060d029b0a6a76e078f0b2d81b6bec7dc681d991e4b86 +size 436375392 diff --git a/full_models/mbh/config.json b/full_models/mbh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbh/vocab.txt b/full_models/mbh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f670b718c8e7921566373915e727d2ace6abc731 --- /dev/null +++ b/full_models/mbh/vocab.txt @@ -0,0 +1,36 @@ +| +a +o +e +n +i +g +l +r +m +t +k +u +v +p +s +h +d +w +j +b +0 +1 +2 +' +3 +5 +4 +6 +8 +9 +7 +- +y +f + diff --git a/full_models/mbj/D_100000.pth b/full_models/mbj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9c0036c1fe1c114c1ea7c6267f06b73fe439895e --- /dev/null +++ b/full_models/mbj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12da637601f072d5cc254ab4415941c3ced515c594d143bebe67a403dd896385 +size 561078601 diff --git a/full_models/mbj/G_100000.pth b/full_models/mbj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0189534eb92ea6c3c325fd85c8bef6b487eb05be --- /dev/null +++ b/full_models/mbj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3867cb3708183048a508563f1fc291bebb2f1041a899f44b090cbf371a70077 +size 436398802 diff --git a/full_models/mbj/config.json b/full_models/mbj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbj/vocab.txt b/full_models/mbj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d5d6c17b4d1fa5f2563feae3f9a10ee0584262a --- /dev/null +++ b/full_models/mbj/vocab.txt @@ -0,0 +1,47 @@ +o +t +s +d +p +0 +9 +y +b +k +̃ +ũ +g +ó +u +h +e + +w +i +é +ä +4 +3 +— +- +j +ã +ë +l +5 +m +6 +a +ẽ +2 +n +r +_ +8 +7 +1 +ǟ +õ +ỹ +ĩ +' diff --git a/full_models/mbt/D_100000.pth b/full_models/mbt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8792b28957c501585d6d6dcaa4d83f051e0241ca --- /dev/null +++ b/full_models/mbt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b9e939064aa75353f76688da4b7ad8c48f2d3c95eca39cf93cbfc21b8923e5b +size 561078627 diff --git a/full_models/mbt/G_100000.pth b/full_models/mbt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b8fe9bb48eb6b88dfec7f24fb8b0de816b55376e --- /dev/null +++ b/full_models/mbt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7496c966268556745087dd4842f2190bd06fab3cb7aaed49f0dbabeb5c67fe5 +size 436359755 diff --git a/full_models/mbt/config.json b/full_models/mbt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbt/vocab.txt b/full_models/mbt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4ba00f9ae63c6e166def4f48a9cbd5602c459eb --- /dev/null +++ b/full_models/mbt/vocab.txt @@ -0,0 +1,30 @@ +| +e +a +n +i +u +k +t +g +m +s +y +d +l +p +w +r +h +b +- +— +' +0 +6 +2 +3 +1 +5 +4 + diff --git a/full_models/mbu/D_100000.pth b/full_models/mbu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9a3619ef92a983c286d99a03dc67450afaee606f --- /dev/null +++ b/full_models/mbu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf2bfa5427254b2ffe1f49d1e7dbef0ba5a602083f3736036e4a963ec1a8dde +size 561079373 diff --git a/full_models/mbu/G_100000.pth b/full_models/mbu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f195714a859c582d2c0861e5e73aa381b9797b72 --- /dev/null +++ b/full_models/mbu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac014753498bdbadc9ec38dac4e8be0fe07f59ab651c3e772cd5799ce34c5b5f +size 436434264 diff --git a/full_models/mbu/config.json b/full_models/mbu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbu/vocab.txt b/full_models/mbu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..26ee7eac61ad8adbd26a3dd1d804ca7230d03c44 --- /dev/null +++ b/full_models/mbu/vocab.txt @@ -0,0 +1,61 @@ +ě +ǝ +ê +n +é +ú +c +y +h +v +2 +́ +g + +d +p +â +û +- +l +k +á +í +t +ì +ū +i +î +ô +̀ +ó +è +r +s +a +_ +z +0 +b +ŋ +ǎ +ɓ +1 +ā +j +ò +f +6 +ɗ +w +ǔ +e +m +ǒ +u +4 +o +à +' +ə +ù diff --git a/full_models/mbz/D_100000.pth b/full_models/mbz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1a43006b17aff5249cd917d0fb75367615de8ef9 --- /dev/null +++ b/full_models/mbz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc952d6bda3f3d6834fc2e779633910dfcb3768cf34c38279929f499ad81dfdc +size 561075950 diff --git a/full_models/mbz/G_100000.pth b/full_models/mbz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bdab29f0ba41f315c2382a8f37f1ccd2f8b52991 --- /dev/null +++ b/full_models/mbz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2aa5924f374127b0cdb7c8cb083e44ba6efa0db22dcaecb78540497ae0a822d +size 436349651 diff --git a/full_models/mbz/config.json b/full_models/mbz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mbz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mbz/vocab.txt b/full_models/mbz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8f705c508e67a4bb044a5ec8d4e90bb127481223 --- /dev/null +++ b/full_models/mbz/vocab.txt @@ -0,0 +1,34 @@ +| +a +n +i +u +t +k +ꞌ +- +o +r +y +c +h +s +ɨ +v +e +ñ +w +j +m +x +g +— +l +p +í +d +f +b +é +ó + diff --git a/full_models/mca/D_100000.pth b/full_models/mca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6486fa18edf38699f08f040fab08b962765d4500 --- /dev/null +++ b/full_models/mca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bdf2d5fb2ba0334cdfbae272cc5a1379e923ec6382bce76000c3c6022f99c1a +size 561078218 diff --git a/full_models/mca/G_100000.pth b/full_models/mca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a7289aae2eec03c851ebc1c9a65ed74c5bed0f9 --- /dev/null +++ b/full_models/mca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21b112b94937a311c45edcbb6a86ff30b3d3c92431eb14715cc3a1111199739 +size 436389685 diff --git a/full_models/mca/config.json b/full_models/mca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mca/vocab.txt b/full_models/mca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f6c919e4e1bdc77510cae6124a2ba7c842931942 --- /dev/null +++ b/full_models/mca/vocab.txt @@ -0,0 +1,43 @@ +| +i +e +a +ˈ +t +n +j +' +k +q +s +h +u +ƚ +y +p +w +m +l +o +x +f +r +— +d +c +ú +b +g +í +é +ó +z +á +v +- +ñ +1 +4 +0 +3 + diff --git a/full_models/mcb/D_100000.pth b/full_models/mcb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d8adf1841f6d8602e571126b2d436c76737cc2ba --- /dev/null +++ b/full_models/mcb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:795bc98c81f7601ab4786e61d0987df817c8d8f9ddc28fccebebe96bddf255d5 +size 561078726 diff --git a/full_models/mcb/G_100000.pth b/full_models/mcb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ad51c284bde3dc80b43886b2bd2fc46944d77b98 --- /dev/null +++ b/full_models/mcb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56552d19abd1b0e7a768082acc5c6ad7af2590346a0a0b7a95927b99b9f085e6 +size 436366793 diff --git a/full_models/mcb/config.json b/full_models/mcb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mcb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mcb/vocab.txt b/full_models/mcb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6a6f818397e8edd31ba99a8b5d72d25852f14952 --- /dev/null +++ b/full_models/mcb/vocab.txt @@ -0,0 +1,33 @@ +a +i +| +r +t +k +n +e +o +g +s +m +p +v +y +h +u +ñ +c +j +— +0 +1 +' +2 +4 +7 +5 +3 +6 +8 +9 + diff --git a/full_models/mcd/D_100000.pth b/full_models/mcd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff94eb00a9b905a536f98b7b224336050b10b235 --- /dev/null +++ b/full_models/mcd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c62692cd23d701ff4b0b48551038602364b19fc344a88b190db938a00c3e74 +size 561078722 diff --git a/full_models/mcd/G_100000.pth b/full_models/mcd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb128ab99be297c24d0b1f9372f7b29fe9c73f2a --- /dev/null +++ b/full_models/mcd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191d783dcc4952a53374e8247b8e36b2daee4f368faef57a1e6c1c38316ee413 +size 436385073 diff --git a/full_models/mcd/config.json b/full_models/mcd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mcd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mcd/vocab.txt b/full_models/mcd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c45f7f4a4799f9f924573d279374786b65bcd749 --- /dev/null +++ b/full_models/mcd/vocab.txt @@ -0,0 +1,41 @@ +6 +c +z + +4 +e +f +o +r +v +i +ú +2 +k +b +é +u +_ +ó +' +a +d +m +á +t +q +7 +j +1 +0 +n +s +y +h +p +— +l +x +g +í +ñ diff --git a/full_models/mco/D_100000.pth b/full_models/mco/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b482b2bf69152b37ce7f15c3db5014dc6a54fbb5 --- /dev/null +++ b/full_models/mco/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b5f46d7643f38cb66a32f5e074271ba20974b362211ab87b00fad531b69ddcd +size 561078618 diff --git a/full_models/mco/G_100000.pth b/full_models/mco/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..31719d1b6074d7ef3110703080d19092288e1d4c --- /dev/null +++ b/full_models/mco/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59307fb047893282a5e9475d1a530d0b859741ac1c1852a348638e52b0af9d6 +size 436389588 diff --git a/full_models/mco/config.json b/full_models/mco/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mco/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mco/vocab.txt b/full_models/mco/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ffb17e3934c1aa54c3689ee334dabbb36dad95cc --- /dev/null +++ b/full_models/mco/vocab.txt @@ -0,0 +1,43 @@ +x +d +b +z +ë +l +ú +ñ +a +u +ó +ä +̈ +ö +ï +f +p +é +c +e +- +q +n +_ +ü +r +y +i +m +g +o +v +í +t +' +́ +á +ɨ +s +h + +k +j diff --git a/full_models/mcp/D_100000.pth b/full_models/mcp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..362261ad838db7d4e1797e5aa4f51d069b578b83 --- /dev/null +++ b/full_models/mcp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f61169bccbd30dc89d9123af325bd9b52f11552268d3a211f3d22591e00edbe +size 561078997 diff --git a/full_models/mcp/G_100000.pth b/full_models/mcp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..04039a7890957794918fcbf5aac17a209ed1f680 --- /dev/null +++ b/full_models/mcp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a1273f03c5c4486a08ed0468eb651a249d3782d6c7a7ee7e2c517df57efbca2 +size 436411407 diff --git a/full_models/mcp/config.json b/full_models/mcp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mcp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mcp/vocab.txt b/full_models/mcp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7d4c39a2ec3db974f33bbe33adf9a7d3be6f87ec --- /dev/null +++ b/full_models/mcp/vocab.txt @@ -0,0 +1,51 @@ +j +o +u +t +î +ʉ +á +g +r +k +ɛ +̧ +é +ú +û +ê +ǒ +ə +ǎ +l +_ +f +h +ɔ +̌ +b +p +ɨ +̂ +c +ô +- +â +z +i +ŋ +s + +w +a +d +í +ǐ +v +́ +y +ó +n +e +ǔ +m diff --git a/full_models/mcq/D_100000.pth b/full_models/mcq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be2e418eece7350bc015a33106c75d3d819c8788 --- /dev/null +++ b/full_models/mcq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9b28e28295550a472e21b06a7c9a039b857746ad9cce89fe37580809457303 +size 561079095 diff --git a/full_models/mcq/G_100000.pth b/full_models/mcq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..37d8d280ac2c428e20613a744159ef601172dd83 --- /dev/null +++ b/full_models/mcq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0786f94a0321014a0f6a0e37fba7843f3fec92cc1b8167da3ad5d429901addea +size 436371866 diff --git a/full_models/mcq/config.json b/full_models/mcq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mcq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mcq/vocab.txt b/full_models/mcq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..626377903b34c2d4d72c549b725b2ba8fe40c060 --- /dev/null +++ b/full_models/mcq/vocab.txt @@ -0,0 +1,34 @@ +p +d +j +é +á +o +r +' +t + +g +5 +n +e +h +7 +i +k +ú +0 +- +a +m +w +2 +v +1 +3 +s +u +í +c +_ +6 diff --git a/full_models/mcu/D_100000.pth b/full_models/mcu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b4fc27b3ae9ad97ea3fb0dd6b75408e2160dd233 --- /dev/null +++ b/full_models/mcu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83c6d147723f1e857a2bfcfee26223d5c1cd56301344f0586d34fc303753af8 +size 561078739 diff --git a/full_models/mcu/G_100000.pth b/full_models/mcu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..21db7140849c6de6a65d6712d3541de523ffde80 --- /dev/null +++ b/full_models/mcu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b958d4c43cd130728527fb096a7f296e401b3836061c3f7c63066722913a256a +size 436427722 diff --git a/full_models/mcu/config.json b/full_models/mcu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mcu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mcu/vocab.txt b/full_models/mcu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6a755af222dd2f7039bf9798915a76219efa0bef --- /dev/null +++ b/full_models/mcu/vocab.txt @@ -0,0 +1,58 @@ +| +n +é +e +ɔ +b +m +a +è +d +l +s +à +y +t +g +k +ŋ +h +i +́ +á +r +u +ò +̀ +í +w +c +o +â +j +ù +ú +f +ê +ì +ó +v +ô +î +̂ +- +` +p +û +1 +2 +3 +5 +4 +' +7 +6 +9 +8 +0 + diff --git a/full_models/mda/D_100000.pth b/full_models/mda/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9402a264e49e8de0876cbf98dfc81badf124b79 --- /dev/null +++ b/full_models/mda/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f37aa74a243193c8a088971ef1b901f051ef5a3cd385fa4c8afdf23fcbc7e3b7 +size 561078625 diff --git a/full_models/mda/G_100000.pth b/full_models/mda/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..29a62de4b44498ecd5e6b97d048cc7c04089c549 --- /dev/null +++ b/full_models/mda/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56eaeaffeef2f350b26fbc0a60ef6301cfba398348cd6e2c2f9d6fda214f0af1 +size 436419636 diff --git a/full_models/mda/config.json b/full_models/mda/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mda/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mda/vocab.txt b/full_models/mda/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ca351e11fac9ac750a90efed44deaf9498b44bf5 --- /dev/null +++ b/full_models/mda/vocab.txt @@ -0,0 +1,56 @@ +| +ə +n +̄ +y +g +m +k +ē +s +̀ +r +b +a +d +ā +t +w +l +u +ɛ +e +à +ɔ +ì +i +p +ū +o +z +ī +è +h +ù +j +c +̆ +v +f +̂ +ō +ò +ŭ +ĕ +ă +â +- +ĭ +ê +û +ô +î +é +ŏ +` + diff --git a/full_models/mdv/D_100000.pth b/full_models/mdv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..43842bbc3d1fb2576156b35a4a50e72351fccc78 --- /dev/null +++ b/full_models/mdv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dec0b21196413a8194032f766c0bdac2905fd761f33dfed88b571720626ee1c +size 561076022 diff --git a/full_models/mdv/G_100000.pth b/full_models/mdv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..65ad237537436d4aac23908241f516c801a27490 --- /dev/null +++ b/full_models/mdv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2754832ca8531a629407bfefb520abd48d4cdd5316925c2297fb870d28fab67b +size 436359092 diff --git a/full_models/mdv/config.json b/full_models/mdv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mdv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mdv/vocab.txt b/full_models/mdv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..04ea7e01a2cf0b95a725b419ef4e7e30a5cf9ffa --- /dev/null +++ b/full_models/mdv/vocab.txt @@ -0,0 +1,38 @@ +— +j +r +o +̱ +_ +k +x +ñ +n +v +c +a +í +b +m +ú +f +e +g +l +z + +́ +s +t +y +d +p +ó +ɨ +h +ꞌ +- +á +i +é +u diff --git a/full_models/mdy/D_100000.pth b/full_models/mdy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c57a6d57d1a5480150413a2d28eb8705569e8768 --- /dev/null +++ b/full_models/mdy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d2dcab6439d6da76fc3c1b012631b61a89872ccf1f8aed0cfb6c73d00cc021 +size 561079119 diff --git a/full_models/mdy/G_100000.pth b/full_models/mdy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8be43f71557b4743c8d3d3c990affea1ccec4ca2 --- /dev/null +++ b/full_models/mdy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d932c3e4fdb3c63c0f8292ff73fb6adac06c6bae0ac489a6a6ea1a813e0256f3 +size 436648193 diff --git a/full_models/mdy/config.json b/full_models/mdy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mdy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mdy/vocab.txt b/full_models/mdy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..99302b7a3640e835147ed96e4a00d782f1167486 --- /dev/null +++ b/full_models/mdy/vocab.txt @@ -0,0 +1,153 @@ +| +ን +ዓ +ሢ +ና +ዒ +ማ +ያ +ይ +ኣ +ዳ +ታ +ዔ +ኔ +ኮ +ቴ +ዛ +ጌ +ሃ +ኬ +ር +ካ +ሲ +ፆ +ባ +ሴ +ዬ +ቶ +ም +ጎ +ጋ +ላ +ዋ +ኤ +ዎ +ኦ +ፓ +ጉ +ዖ +ሮ +ኪ +ጊ +ዲ +ኒ +ሳ +ዴ +ዚ +ፔ +ሣ +ሙ +ቢ +ዻ +ሎ +ኑ +ሪ +ስ +ሶ +ሊ +ሱ +ሺ +ቃ +ቲ +ዶ +ራ +ሚ +ሞ +ቂ +ዞ +ቤ +ሜ +ኢ +ፃ +ኡ +ቄ +ሌ +ዼ +ዑ +ቱ +ዺ +ፒ +ሄ +ፖ +ጮ +ዜ +ጫ +ኖ +ሾ +ቦ +ዱ +ሽ +ሂ +ሼ +ሻ +ኩ +ፂ +ዦ +ል +ው +ዮ +ፑ +ቆ +ሹ +ዾ +ቡ +ሁ +ጴ +ጳ +ቺ +ጪ +ሬ +ቾ +ሩ +ሦ +ዹ +ጲ +ቻ +ቁ +ሉ +ጶ +ፄ +ጬ +ሤ +ዢ +ዙ +ዣ +ብ +ዪ +ዉ +ሡ +ጩ +ዤ +ዌ +ሆ +ሥ +ጂ +ቹ +ቼ +ዊ +ጆ +ፕ +ፁ +ግ +ጄ +ጃ +ዩ +ጱ +ዥ +ክ +ዡ +ዝ +ጁ +ት + diff --git a/full_models/med/D_100000.pth b/full_models/med/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f7242dab625b77c5aaad88da49e78953eaa3f0c3 --- /dev/null +++ b/full_models/med/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4670fe409d6561c48e2ae8e5d185bc41a4697de84e0b9d4e0d26f79d124af40a +size 561078621 diff --git a/full_models/med/G_100000.pth b/full_models/med/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be6d3383c5919d72386d97d1f423066b6ef10a27 --- /dev/null +++ b/full_models/med/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa63a6e84b910a1766b1fbc0490585eb8d8160e1e4f8a05e226d2f833928bd7 +size 436373663 diff --git a/full_models/med/config.json b/full_models/med/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/med/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/med/vocab.txt b/full_models/med/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2fd8a47c2068d111787accc53a1c902d304339f8 --- /dev/null +++ b/full_models/med/vocab.txt @@ -0,0 +1,36 @@ +4 +r +o +- +l +t +8 +2 +7 +u +d +e +m +y +w +_ +g +i +b +6 +ʉ +k +0 +a +ⱡ +' +5 +s +ᵾ +n +1 +p +9 +j +3 + diff --git a/full_models/mee/D_100000.pth b/full_models/mee/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b01854b7a0d39b476ab6f27ac1dfc6a3d87c02ea --- /dev/null +++ b/full_models/mee/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f58a47da10e18da89ba71f5edf9d71bd0ddc70aab385328d82bc41062ff6b4 +size 561076022 diff --git a/full_models/mee/G_100000.pth b/full_models/mee/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59b2cf3e4474ec45ddb1f6fb50f214df0951fd48 --- /dev/null +++ b/full_models/mee/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fabd8004970d1e43d9d21c3b09247966ccd00980cc4a4e2635e0dda1ee90c593 +size 436329121 diff --git a/full_models/mee/config.json b/full_models/mee/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mee/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mee/vocab.txt b/full_models/mee/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..610fae1bb7126168ec2d0f25f4b64cc82612fb1b --- /dev/null +++ b/full_models/mee/vocab.txt @@ -0,0 +1,25 @@ +5 +p +m +2 +0 +g +e +' +s +_ +n +i +l +t +— +a +b +u +r +o +3 +4 +v + +k diff --git a/full_models/mej/D_100000.pth b/full_models/mej/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..083004b53615b00218298426c1b367c48a84062e --- /dev/null +++ b/full_models/mej/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57f3af8a1d80dc390dd02ec85f89099359afbebde8ac1281215cca45c9a4c81 +size 561078197 diff --git a/full_models/mej/G_100000.pth b/full_models/mej/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92a7157d2114c3c6ec3a9c5a9a1d7f493c360658 --- /dev/null +++ b/full_models/mej/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659581489326ca488b3be80cdf6d43100bdded69a0a205d652be1452e7aaf617 +size 436364329 diff --git a/full_models/mej/config.json b/full_models/mej/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mej/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mej/vocab.txt b/full_models/mej/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b7fef77267f3c1a31f6eb3ba6b11af2f7bcdf26d --- /dev/null +++ b/full_models/mej/vocab.txt @@ -0,0 +1,32 @@ +w +' +1 +f +t +4 +d +z +2 +k +l +r +p +s +b +i +h +_ +o +j +g +6 +a + +u +y +c +e +n +0 +m +- diff --git a/full_models/men/D_100000.pth b/full_models/men/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6e89fe0e9b490087bc5ccab21715e2804dbe3b44 --- /dev/null +++ b/full_models/men/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0615a1d17189fbba6d6a9369269f4b9b7bad78f5ad76d3813c6f4ade7f365490 +size 561078721 diff --git a/full_models/men/G_100000.pth b/full_models/men/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2748b242a91ffb8f89fc7b121fb89b302ec43759 --- /dev/null +++ b/full_models/men/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d887490a25dd12cc2ac3abf4626df142d5ab502caa146d25e8deeeef6e86816 +size 436363077 diff --git a/full_models/men/config.json b/full_models/men/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/men/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/men/vocab.txt b/full_models/men/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..28d73a40ca9f7c1f8a5389d473c9e1b6112337ef --- /dev/null +++ b/full_models/men/vocab.txt @@ -0,0 +1,31 @@ +| +a +i +n +e +l +g +ɛ +u +ɔ +m +w +y +t +k +o +b +h +s +p +d +j +v +f +r +- +ŋ +z +' +c + diff --git a/full_models/meq/D_100000.pth b/full_models/meq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf1d2db49802183a8a48dbb243b2f09391fccae2 --- /dev/null +++ b/full_models/meq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e40d39b52fa45fd5bb3a35b6a5fdc7099ce4c98d856a459f58616c86b8bf91 +size 561078639 diff --git a/full_models/meq/G_100000.pth b/full_models/meq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7e5342dc634029002561aae53301cf97979c3604 --- /dev/null +++ b/full_models/meq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcebdd7508b637b533392b2d8803d29a93576641d6bc15e5cab8883d82e249e8 +size 436375894 diff --git a/full_models/meq/config.json b/full_models/meq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/meq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/meq/vocab.txt b/full_models/meq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ec92933a772f4c37f50b721187128651a9bd19b8 --- /dev/null +++ b/full_models/meq/vocab.txt @@ -0,0 +1,37 @@ +| +a +e +y +ə +m +n +t +k +l +h +i +d +w +r +g +s +b +u +o +z +ɗ +ŋ +f +v +p +â +ɓ +ɨ +œ +ʼ +- +0 +4 +3 +2 + diff --git a/full_models/met/D_100000.pth b/full_models/met/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6724b53420188c45f48772715eaa82ab1d8ae042 --- /dev/null +++ b/full_models/met/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10a43c2b0b88fc8dd3288a84e14898c1b3f75a46426ca71b660539b7ab7b7c08 +size 561079248 diff --git a/full_models/met/G_100000.pth b/full_models/met/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20de9c8713bfc5d8d6db8744e80af793e82ef1a9 --- /dev/null +++ b/full_models/met/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a859825181c17e38b08f989b9b631472266c2ef655757b0bc3651e6fb8a08ee3 +size 436378259 diff --git a/full_models/met/config.json b/full_models/met/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/met/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/met/vocab.txt b/full_models/met/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ba4afaf53ecbba492e1e109a1c618f152466ee0d --- /dev/null +++ b/full_models/met/vocab.txt @@ -0,0 +1,36 @@ +1 +_ +- +w +b +p +o +k +8 +y +2 +9 +5 +h +t +g +n +d +0 +4 +r +a +7 +i +s +6 +x +l +e +u +— +3 +ʼ +' + +m diff --git a/full_models/mev/D_100000.pth b/full_models/mev/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..09b456c73823c2c99fecc5203b307daad25ed8af --- /dev/null +++ b/full_models/mev/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71a981ff1c0d8f6c8414824a8ac22ffd1b964ce3e6a6ecc955d238d999601282 +size 561078379 diff --git a/full_models/mev/G_100000.pth b/full_models/mev/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..547f6e59b76372a2d4cac3a27334fafa6453bf67 --- /dev/null +++ b/full_models/mev/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c165a9c487517a636d2add6429aabd6adbabdf6dcb153abe78f1cb0499e2e08a +size 436405836 diff --git a/full_models/mev/config.json b/full_models/mev/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mev/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mev/vocab.txt b/full_models/mev/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b648dc633667d9d1d46b232132f4ff605a06bca --- /dev/null +++ b/full_models/mev/vocab.txt @@ -0,0 +1,50 @@ +| +ɛ +̀ +l +k +ɔ +à +́ +a +á +m +e +̃ +o +é +w +í +i +g +ì +y +è +z +p +- +ó +n +d +b +ò +s +ɓ +ĩ +t +‐ +ã +ú +ù +f +v +u +ũ +ḿ +ṹ +ƃ +h +ŋ +— +' + diff --git a/full_models/mfe/D_100000.pth b/full_models/mfe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f0d1599a5446fda36e778fbe7e44315b2ec7fb13 --- /dev/null +++ b/full_models/mfe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b600ae782b8806694478c817b642d9c8bb00894ebde73629df68d62c6c99e018 +size 561078725 diff --git a/full_models/mfe/G_100000.pth b/full_models/mfe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b30704831fff0c2c0cd5432162559229b492dc26 --- /dev/null +++ b/full_models/mfe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b23fd0e673b21b53827167271bfc39ec817ea920b979017a851fa8e036a0fef +size 436364507 diff --git a/full_models/mfe/config.json b/full_models/mfe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfe/vocab.txt b/full_models/mfe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..72f516167fad6083ee74dbdda1e68612d70d210f --- /dev/null +++ b/full_models/mfe/vocab.txt @@ -0,0 +1,31 @@ +| +n +a +e +i +o +r +t +l +s +k +p +z +m +u +d +b +f +v +w +g +y +- +x +' +0 +h +1 +2 +– + diff --git a/full_models/mfh/D_100000.pth b/full_models/mfh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ac44697177f39ea7e0247f5cf7974ea9a5cd72f2 --- /dev/null +++ b/full_models/mfh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5e47862bb95d8690622aa4da5a0a4204c12b2634a8d561394af5aa9b25d32a +size 561078475 diff --git a/full_models/mfh/G_100000.pth b/full_models/mfh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..76edd01360341e1e5624c5e13141790071f39e35 --- /dev/null +++ b/full_models/mfh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6fdbbfe5359633f689c3113b61061da7d8804079e146e16bc16b26c5577ac8 +size 436380617 diff --git a/full_models/mfh/config.json b/full_models/mfh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfh/vocab.txt b/full_models/mfh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..06d7632536be1743b3e395d69e40c2589e359506 --- /dev/null +++ b/full_models/mfh/vocab.txt @@ -0,0 +1,39 @@ +a +| +l +à +k +ə +g +u +m +w +z +s +t +ŋ +y +n +i +h +d +o +b +e +ɗ +v +r +p +f +̀ +ɓ +' +ò +ù +ì +è +- +j +c +1 + diff --git a/full_models/mfi/D_100000.pth b/full_models/mfi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ebfb293fb2d067bb856ef22ff8f3ebf0a5e21acf --- /dev/null +++ b/full_models/mfi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e057ec8e8a7d12a26172bdb9b0f90710e2c2208e5c69b0c131cb5350cbf4b41 +size 561078600 diff --git a/full_models/mfi/G_100000.pth b/full_models/mfi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2d38a488a0f4d674eb7472886ba506593ebb5b9a --- /dev/null +++ b/full_models/mfi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43573e79f6577faee3225d15cea96d8ea16c1136a4961d9cb9f1fce89e510629 +size 436368858 diff --git a/full_models/mfi/config.json b/full_models/mfi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfi/vocab.txt b/full_models/mfi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a0cf01c5467046417ec247f2feb7518c29cd31ef --- /dev/null +++ b/full_models/mfi/vocab.txt @@ -0,0 +1,34 @@ +a +| +e +n +á +r +i +m +k +d +t +u +s +y +w +l +b +g +h +ŋ +z +ɗ +- +v +f +p +j +c +ɓ +ƴ +í +ú +ꞌ + diff --git a/full_models/mfk/D_100000.pth b/full_models/mfk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..010244c960dba5bb94e18f2d9366fa5dee04f67a --- /dev/null +++ b/full_models/mfk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee827a2ac6725401b63245ca542d5a7f39f99e45d317563532431b872267e5c1 +size 561079110 diff --git a/full_models/mfk/G_100000.pth b/full_models/mfk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1e1b1eff97e189886a4eb3750b063228e5948dca --- /dev/null +++ b/full_models/mfk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9cfa17138874fbf7e6e9691eee083334483ed4caf83464af3457ae60479f2b8 +size 436368446 diff --git a/full_models/mfk/config.json b/full_models/mfk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfk/vocab.txt b/full_models/mfk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7653a62e9a96fde8c2335d696d5bf86f73ee34cf --- /dev/null +++ b/full_models/mfk/vocab.txt @@ -0,0 +1,32 @@ +d +m +ɗ +v +e +s +k +g +n + +l +c +a +o +_ +- +' +z +i +ä +u +h +ŋ +y +r +ə +f +t +b +p +ɓ +w diff --git a/full_models/mfq/D_100000.pth b/full_models/mfq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..89087dbce270c98a10db9e057972ac9a68d5af8a --- /dev/null +++ b/full_models/mfq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2237bd7a7132d0f6278950b9958d82f2f491c392d3b045937bd8de77151d79ef +size 561078875 diff --git a/full_models/mfq/G_100000.pth b/full_models/mfq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53861081992b2e9074aa4c2630e062803894f697 --- /dev/null +++ b/full_models/mfq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f15dbed3fd90eb1948e337161726c40adf34fcbc52249ea657203fcd64b582a +size 436358899 diff --git a/full_models/mfq/config.json b/full_models/mfq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfq/vocab.txt b/full_models/mfq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3aacd6288911574091e7ad0cab37ac9027cbbe82 --- /dev/null +++ b/full_models/mfq/vocab.txt @@ -0,0 +1,28 @@ +| +ɑ +n +i +k +u +b +t +l +e +m +s +y +o +ŋ +d +p +ɔ +' +w +j +f +g +c +a +- +h + diff --git a/full_models/mfy/D_100000.pth b/full_models/mfy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1de51494d63924bcf1216b6df1879c67365414ad --- /dev/null +++ b/full_models/mfy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e072e823cf04ea4397e94d0195a34ccc4605939c2d640348bd8f68e634757f1 +size 561078750 diff --git a/full_models/mfy/G_100000.pth b/full_models/mfy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d296f85c423ecce83092b0860a4163b608edd41 --- /dev/null +++ b/full_models/mfy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee453661284670cc01f0efefb6f104b75db438c51a46f9b5e04afd55115a71b +size 436390776 diff --git a/full_models/mfy/config.json b/full_models/mfy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfy/vocab.txt b/full_models/mfy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5dde52492fc4227d415e1bf00365b0a25b206630 --- /dev/null +++ b/full_models/mfy/vocab.txt @@ -0,0 +1,42 @@ +| +a +e +t +u +k +i +m +n +o +j +h +b +s +r +á +é +p +ä +c +í +l +y +ü +ï +ë +ú +d +ó +ö +g +‐ +— +ñ +f +v +- +z +q +' +x + diff --git a/full_models/mfz/D_100000.pth b/full_models/mfz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd9fc61a645c6af98781a4c2670aa2c1e1f4aca6 --- /dev/null +++ b/full_models/mfz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c871a34b17d05c95d3cdc6f653ce1e6952e52fc0d1d463dfac263ef5d491277 +size 561078749 diff --git a/full_models/mfz/G_100000.pth b/full_models/mfz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..968482f4bec59d8bb8ddc22f390caa7984b44bc0 --- /dev/null +++ b/full_models/mfz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca662a5d5b49a715107271f78fe2345943a6a3d29e5301f4434228ffee09123 +size 436365519 diff --git a/full_models/mfz/config.json b/full_models/mfz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mfz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mfz/vocab.txt b/full_models/mfz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ae26df3676444f25f961b1d45091458d888fdd8a --- /dev/null +++ b/full_models/mfz/vocab.txt @@ -0,0 +1,31 @@ +| +a +ɛ +n +i +k +e +ɔ +y +t +o +c +ŋ +m +b +l +g +w +d +u +j +r +p +ñ +ṭ +ḍ +h +' +ç +š + diff --git a/full_models/mgd/D_100000.pth b/full_models/mgd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a6504bed3f8715e458815182ad49972e15a0e42a --- /dev/null +++ b/full_models/mgd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:734c2304ead216fabd6a2ea3074c356762a46fd01f1a574dad47210f97f2d7c0 +size 561078887 diff --git a/full_models/mgd/G_100000.pth b/full_models/mgd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e0e2e2d6a337d99e98d3aa4f2964aca7a3ecadf5 --- /dev/null +++ b/full_models/mgd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df40b6966431a3afc18aa43751420c3a0e93e203c0ebb1f88c0e2b4a695cf20 +size 436386788 diff --git a/full_models/mgd/config.json b/full_models/mgd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mgd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mgd/vocab.txt b/full_models/mgd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4839089abc630b9090a4972f6615df92febf2ec5 --- /dev/null +++ b/full_models/mgd/vocab.txt @@ -0,0 +1,40 @@ +f +c +î + +z +i +_ +m +ù +ä +n +e +v +a +h +y +à +k +p +ò +w +ì +2 +ŋ +r +t +d +b +è +j +s +l +u +g +' +í +̀ +o +- +ṛ diff --git a/full_models/mge/D_100000.pth b/full_models/mge/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2d88600f80e1fdae65bf9c18fd81eee0bfa2f62d --- /dev/null +++ b/full_models/mge/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb6257d98c6bd4bfa723a0264e5c08a14a0cf327b288ca5d27c9254f326ad87 +size 561079352 diff --git a/full_models/mge/G_100000.pth b/full_models/mge/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..03b41950a127827e8858d9a1f0bbc02528407c5b --- /dev/null +++ b/full_models/mge/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16403f3d1e96807e11b3b5658b6b8f5c55404b3f09f68dd70c2adaa4b800d194 +size 436395706 diff --git a/full_models/mge/config.json b/full_models/mge/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mge/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mge/vocab.txt b/full_models/mge/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cf72904668fb79d6dee6c659f3f8eaf512504cf0 --- /dev/null +++ b/full_models/mge/vocab.txt @@ -0,0 +1,44 @@ +ꞌ +j +ò +k +̰ +m +g +ɗ +u +w +ɨ +o +à +́ +t +_ +b +ṵ +y +s +ɛ +á +e +a +l + +ɔ +r +ḭ +i +p +é +- +̀ +– +ɓ +n +ə +d +è +ù +ó +ḛ +ú diff --git a/full_models/mgh/D_100000.pth b/full_models/mgh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e2e2a7653866ca104659efc41b3aa16308af2c14 --- /dev/null +++ b/full_models/mgh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc7a72ba64c0b2e2081494954ab6869c37b98203e2ab510ae742da727b5ff1b8 +size 561078996 diff --git a/full_models/mgh/G_100000.pth b/full_models/mgh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f6437e299b34e83f51c32f6c05c4a0eae8d3a4b --- /dev/null +++ b/full_models/mgh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64e2051f4ce24c49753b1a62fe42d12428857b20d16204464afe36d587df22c +size 436371853 diff --git a/full_models/mgh/config.json b/full_models/mgh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mgh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mgh/vocab.txt b/full_models/mgh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..76f40727651610d0f81d01767274dfbbbc84cbe4 --- /dev/null +++ b/full_models/mgh/vocab.txt @@ -0,0 +1,33 @@ +2 +- +p +u +m +o + +_ +k +' +r +f +c +y +e +i +1 +z +b +w +l +s +d +8 +0 +a +6 +n +j +t +h +v +g diff --git a/full_models/mgo/D_100000.pth b/full_models/mgo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..527b2ff29dad8c09b8bdd2e391038c3d4c4b0387 --- /dev/null +++ b/full_models/mgo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156df19b5adc1ed22b27c924218d4cbb2591c354be9b24f12eecdaf7a156a887 +size 561079268 diff --git a/full_models/mgo/G_100000.pth b/full_models/mgo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20103fdfa8efab86c0068c9e533bf869098de94c --- /dev/null +++ b/full_models/mgo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889de2af960e3a4f5331ca21bc380e32f0c98d0ce76f6a0229600df8ccaec964 +size 436413941 diff --git a/full_models/mgo/config.json b/full_models/mgo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mgo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mgo/vocab.txt b/full_models/mgo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..85619b99f04f19ca6a31cc9ea23cea77fc9c77f7 --- /dev/null +++ b/full_models/mgo/vocab.txt @@ -0,0 +1,51 @@ +l +ʼ +h +ǐ +n +ě +ŋ +g +m +ǒ +ò +̀ +ì +c +ô +ǔ +u +v +ù +f +k +z +ə +̂ +ɨ +ǎ +à +â +ê + +a +e +r +y +d +i +- +b +_ +̌ +j +û +o +p +' +è +î +s +ɔ +w +t diff --git a/full_models/mhi/D_100000.pth b/full_models/mhi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0099b0666527283c313589a1f2c4a8212e30af68 --- /dev/null +++ b/full_models/mhi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148cb93e3a55a6e801383fd4aa28135f7014afe85ff406ee0fe3e2ee0667222d +size 561078830 diff --git a/full_models/mhi/G_100000.pth b/full_models/mhi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..71acddc8ea4e82665fc7d3e8cbf524a41fd89e2c --- /dev/null +++ b/full_models/mhi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa362673c031b594948109acfeb5ad3cc934d029ddef37663f43c9081172deb9 +size 436361937 diff --git a/full_models/mhi/config.json b/full_models/mhi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mhi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mhi/vocab.txt b/full_models/mhi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..68b2365993fd48f68586211c23d4e42bdb72056d --- /dev/null +++ b/full_models/mhi/vocab.txt @@ -0,0 +1,29 @@ +| +i +a +r +o +n +u +e +d +k +l +s +b +' +t +m +y +g +j +z +v +p +w +c +h +f +- +— + diff --git a/full_models/mhr/D_100000.pth b/full_models/mhr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b9d6cace0debe7b3ba94bb443ad49e2a14444b3 --- /dev/null +++ b/full_models/mhr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d3cf713c1bf37d7922e2d2e40b00e3a630a16f6030f86a4f396683e953e68e +size 561078872 diff --git a/full_models/mhr/G_100000.pth b/full_models/mhr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..786ee223b5ff79ef9dccc50485281ca8cb2658f1 --- /dev/null +++ b/full_models/mhr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5434cb814b2f0e40a21fc8ce16954e6c3c657ce97b26ee45a03841bcecc7b8 +size 436391233 diff --git a/full_models/mhr/config.json b/full_models/mhr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mhr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mhr/vocab.txt b/full_models/mhr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c0a8c8d00e1dc23a5975be35c8a37c90a961d432 --- /dev/null +++ b/full_models/mhr/vocab.txt @@ -0,0 +1,42 @@ +ӧ +п +я +б +ш +т +х +1 +щ +а +ж +ы +ӱ +е +4 +р +- +– + +н +в +и +с +з +ч +ҥ +о +м +ъ +г +' +й +ь +ю +л +ф +_ +ц +к +д +э +у diff --git a/full_models/mhu/D_100000.pth b/full_models/mhu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..884b505ee449998503fe5062c8dc73d20b9740a9 --- /dev/null +++ b/full_models/mhu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c7b3aab59822be6594a7fc399bdfd7426e00c9f19c05bba47817b5b8a4105 +size 561076055 diff --git a/full_models/mhu/G_100000.pth b/full_models/mhu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff5cf3bfacfa7a2ad7c6e3ba1850eb1bc98bedf6 --- /dev/null +++ b/full_models/mhu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea86ae5d4985678b230d521545aa176dc84ee1998dda3de661a102e7bda40938 +size 436350427 diff --git a/full_models/mhu/config.json b/full_models/mhu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mhu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mhu/vocab.txt b/full_models/mhu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7d8414fee7c8d64262f5c50b8ed625fe097ba3c1 --- /dev/null +++ b/full_models/mhu/vocab.txt @@ -0,0 +1,34 @@ +̃ +- +q +' +k +p +u +h +ũ +a +d +s +r +_ +ü +v +n +c +l +o +g +ẽ +z +e +ǃ +t +ã +j +y +m + +w +b +i diff --git a/full_models/mhx/D_100000.pth b/full_models/mhx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5cfb7cc9eea9e2f435a70ac3aca0d75145259310 --- /dev/null +++ b/full_models/mhx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8db4e03a9a0e02646f32e463d241623691b50d47b04d949041e95d033631af +size 561078735 diff --git a/full_models/mhx/G_100000.pth b/full_models/mhx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c4c8ef9495e6e59605a7a8619591473aee9b89e --- /dev/null +++ b/full_models/mhx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d12735ca03bfc3711a133c4b910ac48b2544e503e5bc92dd5f62afb633148072 +size 436373332 diff --git a/full_models/mhx/config.json b/full_models/mhx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mhx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mhx/vocab.txt b/full_models/mhx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..15e932763210065d7e45f8abd37b2cb5ade6901e --- /dev/null +++ b/full_models/mhx/vocab.txt @@ -0,0 +1,35 @@ +o +k +e +1 +g +b +x +q +p +n +- +a +i +0 +' +6 +f + +c +t +w +s +y +v +4 +d +2 +u +r +j +_ +m +z +h +l diff --git a/full_models/mhy/D_100000.pth b/full_models/mhy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f23dce7937468b41c6ac11600372dd55bbc1f3a1 --- /dev/null +++ b/full_models/mhy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a7d1c8111b9d1d09f4883168142cb7b99a19f08151bdc2ad721cfd3686aacc1 +size 561079140 diff --git a/full_models/mhy/G_100000.pth b/full_models/mhy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dfadb682295b5596cc320f252c56be3f66eab4ea --- /dev/null +++ b/full_models/mhy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e267df9b9473f988d3ba52086358526d9b5526f6bcb65fd0d99db7c35320acb9 +size 436369627 diff --git a/full_models/mhy/config.json b/full_models/mhy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mhy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mhy/vocab.txt b/full_models/mhy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0ed171ff909753253aaacedeffa93c83b6866998 --- /dev/null +++ b/full_models/mhy/vocab.txt @@ -0,0 +1,33 @@ + +j +r +p +a +y +u +h +1 +l +4 +5 +_ +n +3 +b +t +d +e +m +k +2 +s +w +o +c +z +0 +f +- +i +6 +g diff --git a/full_models/mib/D_100000.pth b/full_models/mib/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23844d58049e780e30403d9364e327760fb2e7ad --- /dev/null +++ b/full_models/mib/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf05fbd5d920fb83da107c8b0788db833914615576126f426a3e9faf5ba2c7d +size 561078876 diff --git a/full_models/mib/G_100000.pth b/full_models/mib/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ec03534aafc5d173e126056344f7c47211603582 --- /dev/null +++ b/full_models/mib/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7d9c9964ba60504418544c70fea062645a87097bc3c168986fdd273d2fa60e +size 436392171 diff --git a/full_models/mib/config.json b/full_models/mib/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mib/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mib/vocab.txt b/full_models/mib/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..03f67eed7550958ef6475b39b1f9e52c1515cf2a --- /dev/null +++ b/full_models/mib/vocab.txt @@ -0,0 +1,43 @@ +á +j +ā +p +c +l + +ñ +a +í +‐ +u +x +h +i +s +n +- +g +ó +k +́ +q +e +é +z +ɨ +v +r +ō +t +ē +y +f +ū +b +m +d +o +_ +ī +̄ +ú diff --git a/full_models/mie/D_100000.pth b/full_models/mie/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c81f0e2f2a382493bb62122eb5ebd6837d0d4e2a --- /dev/null +++ b/full_models/mie/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44395b9b1ddbd14027f1e4c265b200f2348e74b53e52396c1421bcf3df80086 +size 561078896 diff --git a/full_models/mie/G_100000.pth b/full_models/mie/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4bf205f377bc5c0eb4521307ec85e57f2c0504c0 --- /dev/null +++ b/full_models/mie/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d1dba9fd80f6125a346325b6b58582ea74c6b386cc6ee2c08fd2ae6fb2ab3f +size 436383585 diff --git a/full_models/mie/config.json b/full_models/mie/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mie/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mie/vocab.txt b/full_models/mie/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b62025a2ca119faf196a30c4452c64e28126ee2b --- /dev/null +++ b/full_models/mie/vocab.txt @@ -0,0 +1,39 @@ +b +ē +g +ī +c +á +z +é +ū +_ +- +f +ō +x +h +k +a +y +s +r + +j +o +v +ó +m +t +u +ñ +í +ā +e +n +d +q +p +i +l +ú diff --git a/full_models/mif/D_100000.pth b/full_models/mif/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2083be435248cad2cf3d1131489ea132edd16525 --- /dev/null +++ b/full_models/mif/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3221d66746c4a55952119c56482a6d98f6dc94c4801c70e259fc6f8d4636d343 +size 561078232 diff --git a/full_models/mif/G_100000.pth b/full_models/mif/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ea6870287c1fd3e96f9988b7d5e1a56f89abe7a2 --- /dev/null +++ b/full_models/mif/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7012efbedb6e1d2d49fe2c309e4c396a8bd0cb8606addeb87a15ac2eee72ba2 +size 436361897 diff --git a/full_models/mif/config.json b/full_models/mif/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mif/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mif/vocab.txt b/full_models/mif/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8934e87e04bd83be086699e74af388e114fc3c16 --- /dev/null +++ b/full_models/mif/vocab.txt @@ -0,0 +1,31 @@ +a +| +y +e +m +ə +d +w +r +l +k +g +n +s +h +t +ŋ +b +z +v +u +f +ɗ +c +i +p +j +- +ɓ +' + diff --git a/full_models/mih/D_100000.pth b/full_models/mih/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..33fb642f18f2852e5344dc1daf01f4bc1564902f --- /dev/null +++ b/full_models/mih/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eff41a35521a093cf16c7c2e1fd139cf51910ac3f03d26ada84f8c8e574f436 +size 561078731 diff --git a/full_models/mih/G_100000.pth b/full_models/mih/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..76e303a98e616e50a448bb55c514a31498caa2a3 --- /dev/null +++ b/full_models/mih/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ec494d37bb14bd85379bdf43808715478b19900631b55501532e5ed591e9d3 +size 436378189 diff --git a/full_models/mih/config.json b/full_models/mih/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mih/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mih/vocab.txt b/full_models/mih/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..10f0535955ee5ef3916d5e73bccac8d296b42180 --- /dev/null +++ b/full_models/mih/vocab.txt @@ -0,0 +1,38 @@ +g +q +l +e +r +ꞌ +_ +p +ú +u +s +n +o +j +ó +a +ñ +m +y +á +v +é +x +' +c +ɨ +z +i +t +f +̱ +b +k + +í +́ +d +h diff --git a/full_models/mil/D_100000.pth b/full_models/mil/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..34d53202bc5f7f28b50395891ef0b00e040e171e --- /dev/null +++ b/full_models/mil/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b6b6d3e89d86b33aa653f813e9e4a2f2f7ff105e587622d33637d5638aab300 +size 561078120 diff --git a/full_models/mil/G_100000.pth b/full_models/mil/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59cb8f8b37983a963a2f85a6c3269726f0e2e6fe --- /dev/null +++ b/full_models/mil/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c26a493d1ec82e57bf6ffd4b1577857f14099f962662b27968a6c3762a42ed +size 436405694 diff --git a/full_models/mil/config.json b/full_models/mil/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mil/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mil/vocab.txt b/full_models/mil/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e69940901623840d138ddfea7141b3e3324af617 --- /dev/null +++ b/full_models/mil/vocab.txt @@ -0,0 +1,50 @@ +a +g +ú +á +̀ + +q +c +í +s +o +ǐ +h +ǔ +j +z +ü +e +l +— +_ +t +y +ɨ +ó +n +i +d +è +m +p +v +̌ +b +à +ù +ǎ +k +ñ +‐ +ì +é +r +ǒ +́ +ò +u +ě +x +f diff --git a/full_models/mim/D_100000.pth b/full_models/mim/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b72a73bc4339e7cd13fe74ef11218ab18938792 --- /dev/null +++ b/full_models/mim/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae14266abaaa06de1451a6f2cf487b1cc17d3656a2c99a8eab5f832c0847d7a +size 561076186 diff --git a/full_models/mim/G_100000.pth b/full_models/mim/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f2d1616410bc0f21c74b9d71a1c052a41f17cb9 --- /dev/null +++ b/full_models/mim/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:208a95e5a6fd814fb8825fcd7b682fafac7f96f15bf9a5b31e8c9159997d12fa +size 436358186 diff --git a/full_models/mim/config.json b/full_models/mim/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mim/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mim/vocab.txt b/full_models/mim/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9fcd4a16632c6beddbf83cced8e103085719061b --- /dev/null +++ b/full_models/mim/vocab.txt @@ -0,0 +1,37 @@ +r +d +o +e +x +v +p +g +é +c +‐ +b + +j +l +ꞌ +_ +h +n +q +k +i +ñ +' +ó +z +a +s +u +m +f +̱ +ú +t +í +á +y diff --git a/full_models/min/D_100000.pth b/full_models/min/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1dd447dc9c0a793563170a543d51b32c823a4e0f --- /dev/null +++ b/full_models/min/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7699c1196f4b96b032ee605a6634958950f9dc288967b2d4416d35524eca261 +size 561078599 diff --git a/full_models/min/G_100000.pth b/full_models/min/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..90702acf12f0c41f4b6396a76ea497aeef6c1a28 --- /dev/null +++ b/full_models/min/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b0b4c763ce8984b1ce892008b29009f9e77f00bb8224273ad09dfccb423b1d +size 436371382 diff --git a/full_models/min/config.json b/full_models/min/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/min/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/min/vocab.txt b/full_models/min/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fa7555903e4e058521e3a7be2a7c15fc46197da9 --- /dev/null +++ b/full_models/min/vocab.txt @@ -0,0 +1,35 @@ +a +| +n +k +i +u +o +t +m +d +s +r +b +l +g +h +- +p +y +e +j +w +c +f +z +' +— +0 +4 +6 +1 +2 +5 +3 + diff --git a/full_models/mio/D_100000.pth b/full_models/mio/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5cef90aed873623485d5b18fdcb0515268aa2d07 --- /dev/null +++ b/full_models/mio/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6544a1db11390977550afaae48600787dae1a97bc474bef17adf1bc64cde743e +size 561078580 diff --git a/full_models/mio/G_100000.pth b/full_models/mio/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..979c242400b12c80245168d7bb9724cbf22fdd8d --- /dev/null +++ b/full_models/mio/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58cfa00bc80640916f55317d07facfe273fa868bc962076c84cf0a55075ffcd4 +size 436371486 diff --git a/full_models/mio/config.json b/full_models/mio/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mio/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mio/vocab.txt b/full_models/mio/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d55c89d259cc9b7ae8f2f896cb2ff0fd6b025552 --- /dev/null +++ b/full_models/mio/vocab.txt @@ -0,0 +1,35 @@ +| +a +i +c +n +u +h +t +o +d +r +v +ñ +s +e +y +q +m +x +j +l +p +b +g +f +z +ρ +̄ +- +í +ó +k +é +á + diff --git a/full_models/mip/D_100000.pth b/full_models/mip/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cca3948824ccddecf87ceed5fcdfb932c1f8c7ec --- /dev/null +++ b/full_models/mip/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432407a851eaa964c63540952cdbbc92a19b67c90204ba81be9a679ce2eb6b88 +size 561079383 diff --git a/full_models/mip/G_100000.pth b/full_models/mip/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f7a8a7c1ee88134a8286ead524188e3dbfba8e6 --- /dev/null +++ b/full_models/mip/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c58cccfde17c23201123a7078f7a71fe5426ebafae0e19e9cb76a5e90a5f749 +size 436388980 diff --git a/full_models/mip/config.json b/full_models/mip/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mip/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mip/vocab.txt b/full_models/mip/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..387a79b860a2f9941b2b85739f098ad1cf17c4e2 --- /dev/null +++ b/full_models/mip/vocab.txt @@ -0,0 +1,40 @@ +s +c +a +y +ü +u +̶ +ú +̱ +x +m +t +d +e +p +5 +q +ñ +r +g +ó +v +í +- +k +— +h +i +j +é +á +n +_ +o +f +b +ꞌ + +z +l diff --git a/full_models/miq/D_100000.pth b/full_models/miq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d4db7960cdef001d10c019f1f44724b47daa461 --- /dev/null +++ b/full_models/miq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d93e329c0c718b1c4974ebc112ec9c41ff1782df6099a298332e7658a7968224 +size 561078853 diff --git a/full_models/miq/G_100000.pth b/full_models/miq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c68a8ffa43800feb7b279754607f7ed13be4468 --- /dev/null +++ b/full_models/miq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:779301609e7b2228a01b313c750a06c3fdb6eba3553817df9f3acf035eff1017 +size 436387455 diff --git a/full_models/miq/config.json b/full_models/miq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/miq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/miq/vocab.txt b/full_models/miq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86a134241ccc98f5327b1c816288957ddbdcf08b --- /dev/null +++ b/full_models/miq/vocab.txt @@ -0,0 +1,41 @@ +a +| +i +n +k +b +r +s +u +l +m +t +w +p +d +h +y +g +â +e +j +- +î +o +' +0 +1 +7 +2 +4 +5 +3 +6 +û +9 +8 +ê +f +v +ô + diff --git a/full_models/mit/D_100000.pth b/full_models/mit/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1000efeb8bdb70f6b4b3217239908d1e6fd82746 --- /dev/null +++ b/full_models/mit/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bd22690d0bd693171f36ea5a21b9b9134a5ef3e0dfcc34f17f4dceb75f5fb0 +size 561078476 diff --git a/full_models/mit/G_100000.pth b/full_models/mit/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e63aa244738584972febcea27c0f05f8318420d6 --- /dev/null +++ b/full_models/mit/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9928824e37f68455e10334a0a1211a2bb9b82bb2f203f3c7cded43607994d35a +size 436408137 diff --git a/full_models/mit/config.json b/full_models/mit/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mit/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mit/vocab.txt b/full_models/mit/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..652d92b03f9e2f23b7986c44297f36ff19247ba6 --- /dev/null +++ b/full_models/mit/vocab.txt @@ -0,0 +1,51 @@ +| +n +i +a +c +à +u +d +h +‐ +ì +s +á +t +e +ù +í +o +v +m +x +è +y +ñ +ú +r +é +q +ó +l +g +p +ò +j +b +â +î +f +z +ˋ +ê +ˊ +û +ô +ü +9 +k +3 +4 +0 + diff --git a/full_models/miy/D_100000.pth b/full_models/miy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cb17c60cb9a1917ca71f426dc3c8078d13f9d16d --- /dev/null +++ b/full_models/miy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d7ef5202f6a25e0d5cfa81057fe4eaa8344d7fb36da35738147c6e85d20e9d4 +size 561076183 diff --git a/full_models/miy/G_100000.pth b/full_models/miy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d3020fa85e7b5134d8bd3b5263ca18e5568b8c55 --- /dev/null +++ b/full_models/miy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145bf819b5b5779962c5d83f613ecbc3e14862876647dd155634bd1832f8db7e +size 436367287 diff --git a/full_models/miy/config.json b/full_models/miy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/miy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/miy/vocab.txt b/full_models/miy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7628453aac551e1c0ac4730d96ea0bd9a70c6499 --- /dev/null +++ b/full_models/miy/vocab.txt @@ -0,0 +1,41 @@ +_ +n +̱ +m +ë +y +ú +g +c +h +ó +ñ +ö +j +ü +á +p +o +z +k +e +t +ꞌ +l +u +f +i +ï +r +v +q +d +­ +s +é + +x +ä +a +í +b diff --git a/full_models/miz/D_100000.pth b/full_models/miz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..13e85d144d7b106c604d4bc819e2891b3a34777f --- /dev/null +++ b/full_models/miz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e531c9cc43b211f0629b38e1f93c22d27d5354a078306f77be86399c52d21226 +size 561079392 diff --git a/full_models/miz/G_100000.pth b/full_models/miz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..786cf8d871fd0677b563db03136a12eb19f9f784 --- /dev/null +++ b/full_models/miz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b53d1b95f3d5b532a6585b02b0d2fab74981fa83aa8485ee42a41866250ddab +size 436410543 diff --git a/full_models/miz/config.json b/full_models/miz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/miz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/miz/vocab.txt b/full_models/miz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5a1342bad718efb38110e17487990f80903bd7dc --- /dev/null +++ b/full_models/miz/vocab.txt @@ -0,0 +1,50 @@ +â +o +ē +y +e +u +d +g +ú +c +— +û +̂ +í +f +ō +s +ñ +i +v +k +̄ +ó +ā +́ +x +ī +p +j +b +n +l +ꞌ +q +t +r +h +ô +á + +ê +î +m +é +_ +a +ū +z +ɨ +ʼ diff --git a/full_models/mjl/D_100000.pth b/full_models/mjl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5e139f9f68c7c5cef0312ff7ef1b62a447725a6f --- /dev/null +++ b/full_models/mjl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f3fbc20464e9ec028134f1aa7d3a3a59ffa14d9dc0e25d7125030813d8a1ce +size 561077941 diff --git a/full_models/mjl/G_100000.pth b/full_models/mjl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d508f9d453e33511e1146493bbe6d768ba0c5775 --- /dev/null +++ b/full_models/mjl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea534dbe1d92d176b0b650bded60f3ef2f18c2c8db83261de3ee97ace9a1144 +size 436429038 diff --git a/full_models/mjl/config.json b/full_models/mjl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mjl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mjl/vocab.txt b/full_models/mjl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cdc61f7ede663299fb486170efb759a4e138a746 --- /dev/null +++ b/full_models/mjl/vocab.txt @@ -0,0 +1,63 @@ +| +ा +े +र +् +स +ह +क +ी +ि +ो +त +न +ं +म +ल +ज +य +प +ु +द +ब +ण +आ +ग +ू +व +ई +च +ख +भ +ए +ड +झ +़ +थ +ै +ठ +ध +ऊ +अ +ँ +ऐ +इ +फ +उ +ट +छ +ौ +- +ढ +घ +ः +ओ +ञ +' +ष +ृ +औ +2 +0 +7 + diff --git a/full_models/mjv/D_100000.pth b/full_models/mjv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..166c9605f913057631d0c899afd81ca8aea7a064 --- /dev/null +++ b/full_models/mjv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd407a4f1529ee905478aa84f9a1f4804f5be6f13abbe0e0b3c93012147dd86 +size 561079482 diff --git a/full_models/mjv/G_100000.pth b/full_models/mjv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c60e2a4e41eb40d88d6952e9eb53ad996a5a0de --- /dev/null +++ b/full_models/mjv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2991971843afe10021614254fbf8ec509f42318b154a65bf2819ee47310b14a +size 436421177 diff --git a/full_models/mjv/config.json b/full_models/mjv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mjv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mjv/vocab.txt b/full_models/mjv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b115ac9a665864dc1f1cba8b188fc3d7d03633a2 --- /dev/null +++ b/full_models/mjv/vocab.txt @@ -0,0 +1,54 @@ +ള +ത +ി +ന +ൽ +ല +പ +േ + +ഞ +ം +എ +ു +ച +ൺ +ൂ +ർ +ആ +ണ +ോ +ഒ +6 +ീ +അ +' +ട +ഇ +ഈ +ങ +ജ +ഓ +3 +ഏ +ൾ +ാ +0 +െ +- +യ +റ +‍ +ശ +ഉ +് +4 +ഊ +വ +ക +ൊ +ൻ +ബ +ര +_ +മ diff --git a/full_models/mkl/D_100000.pth b/full_models/mkl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6e4206af85a8c2b1662a9af2dce927924f3dd379 --- /dev/null +++ b/full_models/mkl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ddac3464b0f41c951985c24e97607ecd40786d25a6c65d922968da2fcd14c97 +size 561078970 diff --git a/full_models/mkl/G_100000.pth b/full_models/mkl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c741247f85bf3f24f28632bfa26a822502d1f3df --- /dev/null +++ b/full_models/mkl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9baa6f7d5697523df159880f664ed43e68bdb2c213a06bbe05137058e70a898e +size 436405551 diff --git a/full_models/mkl/config.json b/full_models/mkl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mkl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mkl/vocab.txt b/full_models/mkl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..22add8bd11bed7958230a8031933d8eec0d180ad --- /dev/null +++ b/full_models/mkl/vocab.txt @@ -0,0 +1,48 @@ +| +ɑ +i +ɛ +n +ɔ +u +k +e +m +b +ŋ +s +o +d +w +y +l +̃ +í +j +̀ +t +g +f +c +r +p +h +́ +a +ù +z +ǹ +ì +ĩ +ò +ũ +à +v +ú +á +ń +é +ó +1 +è + diff --git a/full_models/mkn/D_100000.pth b/full_models/mkn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5364432170bde77ab499e7158b8476eb5218dd94 --- /dev/null +++ b/full_models/mkn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e746ca87fd1e2788c3b75603b5f0623a641c8cf32a936e13cc96a01f5d36088 +size 561076027 diff --git a/full_models/mkn/G_100000.pth b/full_models/mkn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0849deee73e7b574581488f6d058eb58880569b9 --- /dev/null +++ b/full_models/mkn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d246033ae2f871d683f2bb12780023d7bdc46a557b3d982ddad9433fb780696 +size 436342959 diff --git a/full_models/mkn/config.json b/full_models/mkn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mkn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mkn/vocab.txt b/full_models/mkn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a5d301a9d75bfc3b9c6ca58c8588403d3c28aa7b --- /dev/null +++ b/full_models/mkn/vocab.txt @@ -0,0 +1,31 @@ +g +m + +t +c +k +e +f +y +w +_ +l +n +h +i +u +í +b +á +o +é +a +- +r +d +p +j +' +s +ó +ú diff --git a/full_models/mlg/D_100000.pth b/full_models/mlg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88fb8abafa14e5020d57ffd0c189409030eb724f --- /dev/null +++ b/full_models/mlg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c07443fdca3a54e2b2e4b274224016bdc004f04462bf4af8ee41b80b630b2631 +size 561078243 diff --git a/full_models/mlg/G_100000.pth b/full_models/mlg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5920e0a5b604530a26d8bfdb1378a61371eee841 --- /dev/null +++ b/full_models/mlg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc924fff8a15863c1ced9b2f1a8e24dcb536f3cf112019b65463a53f18b9427f +size 436356368 diff --git a/full_models/mlg/config.json b/full_models/mlg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/mlg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mlg/vocab.txt b/full_models/mlg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..740ac2c9b2ee51406e390981f4fdf999a89c6635 --- /dev/null +++ b/full_models/mlg/vocab.txt @@ -0,0 +1,30 @@ +a +| +n +i +y +o +r +t +m +e +h +s +k +f +z +d +l +' +v +p +b +j +- +g +à +ỳ +ô +ò +ì + diff --git a/full_models/mmg/D_100000.pth b/full_models/mmg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6444990f18a8241f2d4b91ab24d4c130b2d8046d --- /dev/null +++ b/full_models/mmg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53348388d2aa2f35992785c476e355da61b182f34a594d2014799d7966be6a36 +size 561076030 diff --git a/full_models/mmg/G_100000.pth b/full_models/mmg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c937535ce5e964ebf8fd43d0e949664d990cc1a1 --- /dev/null +++ b/full_models/mmg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d10371f7cd797245705ca34a8a0d35c7f3a9517806568b3f95ff31d61a98bb +size 436349872 diff --git a/full_models/mmg/config.json b/full_models/mmg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mmg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mmg/vocab.txt b/full_models/mmg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b32754be1c50f5bb4a8a1256e63e6a3ded138824 --- /dev/null +++ b/full_models/mmg/vocab.txt @@ -0,0 +1,34 @@ +b +9 +6 +m +n +r +o +u +i +f +3 +s +8 +l +y +g +0 +1 +v +k +7 +w +e +- +_ +ō +j +a +2 + +h +4 +t +5 diff --git a/full_models/mnb/D_100000.pth b/full_models/mnb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..030a7fd285a2bbf59f77686f7d08cf69df50b28c --- /dev/null +++ b/full_models/mnb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce799c2ab0c18aa2606091393cf0dddf48fd960b5eca1432e61bb047d0706151 +size 561078760 diff --git a/full_models/mnb/G_100000.pth b/full_models/mnb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..35a137f5001f2fd9994ec2680230b3ef6a64a040 --- /dev/null +++ b/full_models/mnb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59c355e4e18e895d8b0902c7f660f97138bc13c3b67e706844da36b7305e139 +size 436351662 diff --git a/full_models/mnb/config.json b/full_models/mnb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mnb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mnb/vocab.txt b/full_models/mnb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24bf82e9d462b064fef749a44dd2c1be9d421232 --- /dev/null +++ b/full_models/mnb/vocab.txt @@ -0,0 +1,25 @@ +a +| +o +n +i +e +m +u +h +k +t +d +s +' +l +b +p +w +g +f +r +- +y +z + diff --git a/full_models/mnf/D_100000.pth b/full_models/mnf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5ce2e150ebc0be5e4a2150d92f2a08bc8342acea --- /dev/null +++ b/full_models/mnf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186d55627dd9456a87a7956112245f649aab91ca40ea791bbd7fef3b54cf4daa +size 561078767 diff --git a/full_models/mnf/G_100000.pth b/full_models/mnf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c1a65345169cfc5156e12955b620f4b51c2b4f2e --- /dev/null +++ b/full_models/mnf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f4d37649e55e10495eb646eba6c10017f04aceb317595d16c54206ec11ab92 +size 436410548 diff --git a/full_models/mnf/config.json b/full_models/mnf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mnf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mnf/vocab.txt b/full_models/mnf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8cc1aa9bfba973e4d7bd97ec86e80196e06b7d35 --- /dev/null +++ b/full_models/mnf/vocab.txt @@ -0,0 +1,52 @@ +| +a +b +n +à +t +e +m +ɨ +ɔ +è +̧ +l +̀ +k +u +w +s +ˈ +g +i +ò +y +h +ŋ +d +ə +ê +f +o +z +ì +ù +̂ +p +ǎ +ȩ +j +û +v +â +̌ +ě +ǔ +ǒ +c +ǐ +î +ô +' +- + diff --git a/full_models/mnk/D_100000.pth b/full_models/mnk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..89067704fb55fc2f5110e6e2a0b154caf3e0a94c --- /dev/null +++ b/full_models/mnk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c62a7ac847f22687e56cbc745f08baa2a582c0b7273841e198d8c8baba02bb2 +size 561078636 diff --git a/full_models/mnk/G_100000.pth b/full_models/mnk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c7cc750a152504942345358072c2931c25fe6d8 --- /dev/null +++ b/full_models/mnk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb1fb408cdcf37673edd77c2ed67142abb0c32f856d21f8d861286123bd6142 +size 436364788 diff --git a/full_models/mnk/config.json b/full_models/mnk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mnk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mnk/vocab.txt b/full_models/mnk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..420d1a4dfcc46eabdffd361e8bacc72c5d805ebe --- /dev/null +++ b/full_models/mnk/vocab.txt @@ -0,0 +1,31 @@ +| +a +o +i +e +l +u +n +k +t +ŋ +m +b +y +s +r +d +w +f +ñ +j +ì +h +- +p +ǹ +̀ +à +c +' + diff --git a/full_models/mnw/D_100000.pth b/full_models/mnw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..86a4e56a4e3f717e49dacd100407c4f1d51a6852 --- /dev/null +++ b/full_models/mnw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2431443f3617a4a1d5509bea56684b6a1e54586c56872f6a3967765526b5dbb +size 561078846 diff --git a/full_models/mnw/G_100000.pth b/full_models/mnw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1c414deb68aaf0bfe0ad10434b6e923aa24a875a --- /dev/null +++ b/full_models/mnw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327895ea2cb878ffa04c24b0cca875d5f55cbe3802bfb29adceb3d8630ad92cf +size 436431823 diff --git a/full_models/mnw/config.json b/full_models/mnw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mnw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mnw/vocab.txt b/full_models/mnw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b7f26c480656d6693a53b00890a03cac8a1a1d31 --- /dev/null +++ b/full_models/mnw/vocab.txt @@ -0,0 +1,60 @@ +ၝ +ါ +၆ +ဥ +ဗ +ဓ +ဍ +ၠ +ၚ +မ +ပ +ရ +ဴ +ၟ +လ +သ +ွ +ယ +ဨ +ဘ +အ +တ +ည + +ခ +ထ +ဣ +ဳ +ူ +က +ိ +ေ +ဒ +ီ +ျ +ဵ +ၜ +ဩ +_ +ဂ +ဇ +ဲ +ှ +္ +ဟ +် +ြ +စ +ံ +န +ဝ +ု +ဏ +ဖ +ဃ +ၞ +း +ဿ +ာ +ဆ diff --git a/full_models/mnx/D_100000.pth b/full_models/mnx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ede0070e27b7206bb4e2520437be2645638dbbab --- /dev/null +++ b/full_models/mnx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e5062d0cf332dd411685ab8e6c2b1146146aa5b066154f3fbfb24c6f71a570a +size 561076153 diff --git a/full_models/mnx/G_100000.pth b/full_models/mnx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d087a06daf5462e2dfb97b65fc1ed9be7302863d --- /dev/null +++ b/full_models/mnx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f3d98e02371e4c133ae60ccf4f8c4ed3a7d4c00605615f78fba6f40b47196f +size 436328250 diff --git a/full_models/mnx/config.json b/full_models/mnx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mnx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mnx/vocab.txt b/full_models/mnx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b6de82747d05fe3d273b3d0f5583f3f74d2234c4 --- /dev/null +++ b/full_models/mnx/vocab.txt @@ -0,0 +1,24 @@ +j +u +c + +s +w +k +g +y +f +t +p +m +o +e +i +h +d +a +n +r +b +l +_ diff --git a/full_models/moa/D_100000.pth b/full_models/moa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff80644d1b29a7c070698268215ec769cd104d20 --- /dev/null +++ b/full_models/moa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e72c25d181a5cada300049f54fec318878e4ee917bd49f99dc8398ba951303 +size 561078590 diff --git a/full_models/moa/G_100000.pth b/full_models/moa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ee131598e8320e082da0835ad2ffe4dcc059907 --- /dev/null +++ b/full_models/moa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8affcca64e93003391c3b3ca4b0e9754b8cbd6251c240bb8527813703dc7a80 +size 436364457 diff --git a/full_models/moa/config.json b/full_models/moa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/moa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/moa/vocab.txt b/full_models/moa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e70e37ddfe30578dbb7fc851d4fda4ccd7f4f5c0 --- /dev/null +++ b/full_models/moa/vocab.txt @@ -0,0 +1,32 @@ +d +ɛ +a +_ +v +u +o +q +c +w +z +h +n +g +' +ɔ +- +i +t +b +f +k +s +e +m +ŋ + +j +y +p +r +l diff --git a/full_models/mog/D_100000.pth b/full_models/mog/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49908592e3f72a9b88c5befa64e3895506c7627b --- /dev/null +++ b/full_models/mog/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab333b83ab2146fd8861d7933ea7a9a544f011f66a01ecf24fbad2a0f1a6eef +size 561078700 diff --git a/full_models/mog/G_100000.pth b/full_models/mog/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87df1fbebb7339c3903c3caec255e081e0b6e97c --- /dev/null +++ b/full_models/mog/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:163e6c1f3948d616ce6794b7272af7e3eaa0424fe327837669702f1a29d6bf87 +size 436375859 diff --git a/full_models/mog/config.json b/full_models/mog/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mog/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mog/vocab.txt b/full_models/mog/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f27311ef9c2ef617a92ddac6391668ece606438b --- /dev/null +++ b/full_models/mog/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +o +i +t +m +u +k +g +b +d +s +' +p +y +r +e +l +á +h +í +ḷ +w +- +ḻ +ú +j +ó +c +é +z +0 +4 +f +1 + diff --git a/full_models/mon/D_100000.pth b/full_models/mon/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81abc4ad77cacf34e7b167de648814bc1e5dba86 --- /dev/null +++ b/full_models/mon/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5b7d92fdf7a08ab7dcc8da5cd22301b6fd01088a001518f86091178b521f34 +size 561078628 diff --git a/full_models/mon/G_100000.pth b/full_models/mon/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9ee1c9640701d5f3b2a26043d16da934e66f0e8 --- /dev/null +++ b/full_models/mon/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c7f100a396236d4425eb0b2d01cd9ed218521c9d0bd2063adde06550f921b9 +size 436438174 diff --git a/full_models/mon/config.json b/full_models/mon/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mon/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mon/vocab.txt b/full_models/mon/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..59428b93016f7acb0560edd30fb009784115c514 --- /dev/null +++ b/full_models/mon/vocab.txt @@ -0,0 +1,64 @@ +| +а +э +н +г +р +д +и +х +ү +л +т +й +о +у +с +б +ѳ +м +ч +в +ж +ь +з +ы +е +щ +ц +я +ю +— +ё +п +к +ф +ъ +j +l +e +b +p +i +m +f +n +x +g +r +q +v +s +c +d +w +k +u +o +y +z +a +t +h +- + diff --git a/full_models/mop/D_100000.pth b/full_models/mop/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e0c5e9a6d68110b713c277253f9fa6b81348e9c --- /dev/null +++ b/full_models/mop/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27432788c4df4f18a043ec67bbd64fc2c582663fddd38e770316e696275c11c6 +size 561077420 diff --git a/full_models/mop/G_100000.pth b/full_models/mop/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3531bdb262bc8c6c2c75377fb87423c261613b55 --- /dev/null +++ b/full_models/mop/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1ba0838b69a592b8a78a8162445e6abf321ac8fb52c1666f17877497a8ae54 +size 436391994 diff --git a/full_models/mop/config.json b/full_models/mop/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mop/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mop/vocab.txt b/full_models/mop/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..05a96354c3352a8e92d7fdfe387897695a753e48 --- /dev/null +++ b/full_models/mop/vocab.txt @@ -0,0 +1,44 @@ +| +a +' +i +u +e +c +t +o +l +n +j +b +s +m +y +h +x +q +p +w +d +ü +z +r +— +g +- +f +v +é +0 +у +2 +1 +k +ñ +3 +5 +6 +4 +9 +7 + diff --git a/full_models/mor/D_100000.pth b/full_models/mor/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..40fea6677d0da2d942a59cad5b2da315a198702c --- /dev/null +++ b/full_models/mor/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673c1e0fe0206bb3ef1b19ff84324f20127f919ef15827e3e9c0eebd54f65bdf +size 561078863 diff --git a/full_models/mor/G_100000.pth b/full_models/mor/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1bc83ffcefff2917abc886701c567099c1cd8e73 --- /dev/null +++ b/full_models/mor/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c151b1e8d20747f72d5748b298d64d454c1b278c7be5ad6f563cac6ed71bbc0d +size 436373753 diff --git a/full_models/mor/config.json b/full_models/mor/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mor/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mor/vocab.txt b/full_models/mor/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ba04fab90acc40248a379be0d330f0949cc92a25 --- /dev/null +++ b/full_models/mor/vocab.txt @@ -0,0 +1,34 @@ +| +a +i +n +ǝ +e +ŋ +l +r +đ +g +ṯ +o +u +m +ɽ +w +ñ +d +ë +b +s +y +c +t +f +k +p +j +ḏ +- +v +' + diff --git a/full_models/mos/D_100000.pth b/full_models/mos/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..4988fb3ddc6d2e4875713dc5fffec87cccf9a073 --- /dev/null +++ b/full_models/mos/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e569b8ac03fea31f853af4218d22c2244038d166f3a8f5ea1fdc9a6840b6b99 +size 561079222 diff --git a/full_models/mos/G_100000.pth b/full_models/mos/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..2098713cb2825c8d95cde56409e5b9528402efdd --- /dev/null +++ b/full_models/mos/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a70d00136490c8c1a3761bbe67f174c7dfe157007dc0b1c43901ccc495c3eb +size 436376904 diff --git a/full_models/mos/config.json b/full_models/mos/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mos/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mos/vocab.txt b/full_models/mos/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..59b4e0f611c510c1671a24ce5aad1b441150335d --- /dev/null +++ b/full_models/mos/vocab.txt @@ -0,0 +1,35 @@ +| +a +n +e +b +m +g +s +o +y +d +l +t +ẽ +i +k +ã +r +ɩ +- +ʋ +w +z +p +u +õ +f +ɛ +ũ +ĩ +v +' +– +6 + diff --git a/full_models/mox/D_100000.pth b/full_models/mox/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f79f7074758206e005a45e1c7d0d551e5f26f47b --- /dev/null +++ b/full_models/mox/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b9ee14a5a6e39104e39ab56d7c12a19c1fa3a4e53f6f709c83cd50c2d2e35bf +size 561078848 diff --git a/full_models/mox/G_100000.pth b/full_models/mox/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0cc7ff39e8da87876f0b0e7d7b3c1774b89f4c02 --- /dev/null +++ b/full_models/mox/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27255d43d5590a69a91e8334b4c09ddb5c32521edb58742f61842ba5e59f683 +size 436373661 diff --git a/full_models/mox/config.json b/full_models/mox/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mox/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mox/vocab.txt b/full_models/mox/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ed9971a04106572521281a2b786098211fbd5dd1 --- /dev/null +++ b/full_models/mox/vocab.txt @@ -0,0 +1,36 @@ +h +2 +7 +_ +i +8 +3 +v +w +1 +0 +5 +q +t +o +- +l +y +u +a + +6 +e +k +m +s +9 +f +d +4 +ʼ +n +b +' +— +g diff --git a/full_models/moz/D_100000.pth b/full_models/moz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..119eecd9e89ef85b15fd8982c07dc751271b0fa5 --- /dev/null +++ b/full_models/moz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e80c2dab149c24f4ed4ee4880d30b54478703f213d814b647c1f85249d00ff +size 561079365 diff --git a/full_models/moz/G_100000.pth b/full_models/moz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..896e78755c0847151de1a24630e3f78b1daa5e8a --- /dev/null +++ b/full_models/moz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56ab45d2f5c92b29753429cfed8231f9d0c10d3150862b5b0af5793a0b10971 +size 436386876 diff --git a/full_models/moz/config.json b/full_models/moz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/moz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/moz/vocab.txt b/full_models/moz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f68f17e9a6eb7da03ae3026b562abf13bb37c438 --- /dev/null +++ b/full_models/moz/vocab.txt @@ -0,0 +1,40 @@ +ó +ɗ +- +u +̰ +ɓ +_ +b +w +j +h +ƴ +— + +â +û +l +a +n +ú +z +á +î +ŋ +s +t +m +r +ô +d +p +c +e +ʼ +k +í +g +y +i +o diff --git a/full_models/mpg/D_100000.pth b/full_models/mpg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5689808ab537a15e0f49f47ef2002201d82d9bb --- /dev/null +++ b/full_models/mpg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a474d0effd431d2bcf68f6c442e9984f3fdb6002ec30f96b27177f8ee67d62a9 +size 561078758 diff --git a/full_models/mpg/G_100000.pth b/full_models/mpg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa50eaf8b009793da80a02335fd61d9a86f85687 --- /dev/null +++ b/full_models/mpg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a45e8f90fb2e5dfd6bee670e3e78d016bb90b249d421bb4c78734697884dc6 +size 436388332 diff --git a/full_models/mpg/config.json b/full_models/mpg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mpg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mpg/vocab.txt b/full_models/mpg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ee9faacb3f551fec992475bfe44c5f62c3a17f39 --- /dev/null +++ b/full_models/mpg/vocab.txt @@ -0,0 +1,42 @@ +| +a +i +m +n +u +d +g +e +l +t +k +' +o +s +h +b +r +z +y +w +v +j +c +p +â +á +f +î +- +ä +ê +ï +û +ô +à +ì +ü +q +ö +x + diff --git a/full_models/mpm/D_100000.pth b/full_models/mpm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e2a986f86c575a6f8e0d51c1cfa7db674b0a882 --- /dev/null +++ b/full_models/mpm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59854c471c13f6bc354043dc46c5fe3aac2ea055cbc4fa64feaaec1f79259282 +size 561078615 diff --git a/full_models/mpm/G_100000.pth b/full_models/mpm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cb9ae53251603a5bdc823a5cd04fdb2201becea3 --- /dev/null +++ b/full_models/mpm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:333936bb395ab03bc4158216b9256e95b3b3b8b61410b9cddcdac59a8bbecba9 +size 436382751 diff --git a/full_models/mpm/config.json b/full_models/mpm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mpm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mpm/vocab.txt b/full_models/mpm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..746ce58121318c784874159f404afebe989bc2f3 --- /dev/null +++ b/full_models/mpm/vocab.txt @@ -0,0 +1,40 @@ +ɨ +i +_ +ū +p +' +í +a +d +ā +g +h +x +s +m +e +y +ī +b +ñ +é +n +̄ +v +z +l +q +c +k +j +t +u +ú +́ +r +o +f + +ó +á diff --git a/full_models/mpp/D_100000.pth b/full_models/mpp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..442c65d9c3e15d91d17b6f29db84a4306cdd0e3e --- /dev/null +++ b/full_models/mpp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f44e92adb1e4e3a6a8d649dfcf39feb910035857fe9f8311bf1cf4915ebe83 +size 561078628 diff --git a/full_models/mpp/G_100000.pth b/full_models/mpp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..12c78ea25f6af34825adc2d1212340ccd5e72c30 --- /dev/null +++ b/full_models/mpp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac352fe06574bef7636c9e382ce65cacaea9268afd782ccd6fabc5d3262740a +size 436375856 diff --git a/full_models/mpp/config.json b/full_models/mpp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mpp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mpp/vocab.txt b/full_models/mpp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..44f7f608ee3abf06b38ec36246007265aec643d1 --- /dev/null +++ b/full_models/mpp/vocab.txt @@ -0,0 +1,37 @@ +_ +o +g +3 +l +i +4 +c +t +d +p +9 +u +­ +z +7 +n +b +a +2 + +5 +f +w +6 +' +k +e +h +1 +m +- +0 +r +s +8 +y diff --git a/full_models/mpx/D_100000.pth b/full_models/mpx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..875d7012c1c5e057a0166dfa4a99cbe4cd86091f --- /dev/null +++ b/full_models/mpx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e41a4f48c05406618799c9205abb272a3c76a7292f35396d648b83d8a55ffc81 +size 561078486 diff --git a/full_models/mpx/G_100000.pth b/full_models/mpx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a82c7c7c684754885a58546d4a9faec2ff6dfc16 --- /dev/null +++ b/full_models/mpx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5596be93d6c7b07ad312b42548bbf8011bff53058c67f32e20daa10f84bba6d +size 436362147 diff --git a/full_models/mpx/config.json b/full_models/mpx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mpx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mpx/vocab.txt b/full_models/mpx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bc98f8cac4e549800127a26f21bb9fc315c04416 --- /dev/null +++ b/full_models/mpx/vocab.txt @@ -0,0 +1,31 @@ +a +| +i +n +e +l +o +u +g +w +t +b +y +k +h +m +s +p +v +d +- +' +— +0 +1 +2 +6 +4 +3 +5 + diff --git a/full_models/mqb/D_100000.pth b/full_models/mqb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..35462c9c8c34ef7f08de151e1f7c1828f56a6b09 --- /dev/null +++ b/full_models/mqb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77f2fd56cb797a8873d06971882e9ee31a8b6f8830ebbd51408daabcf93aac7 +size 561078585 diff --git a/full_models/mqb/G_100000.pth b/full_models/mqb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..33600557be1219d3249541e6ce27c1632200ce2d --- /dev/null +++ b/full_models/mqb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5ceb68b7d364b78417fe7e6919c937aa8d345d5e5baa6bac12818048dd3a09 +size 436391984 diff --git a/full_models/mqb/config.json b/full_models/mqb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mqb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mqb/vocab.txt b/full_models/mqb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bd9a5047487b5d0724babc4fc87f7881482ad936 --- /dev/null +++ b/full_models/mqb/vocab.txt @@ -0,0 +1,44 @@ +| +a +n +ə +y +k +e +m +t +w +s +i +o +l +u +h +r +ɗ +b +à +g +d +p +z +c +j +v +f +ʼ +ɓ +â +̀ +̂ +ù +ì +œ +á +é +î +- +û +ò +2 + diff --git a/full_models/mqf/D_100000.pth b/full_models/mqf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..24ba4a91b9f09a979a01335abbc71176b9bd7d74 --- /dev/null +++ b/full_models/mqf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb04a776d845f6d256c0f06cb15b7894a2d78fb66ea450f5a40baf6d278515d1 +size 561078236 diff --git a/full_models/mqf/G_100000.pth b/full_models/mqf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d69afb438403c2b9baa594927ae3e3ccd9d7abe --- /dev/null +++ b/full_models/mqf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f90552de059b4501ae73785b6bec92f3246cf3beda733ba7b2ef56ddda8e3b +size 436394417 diff --git a/full_models/mqf/config.json b/full_models/mqf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mqf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mqf/vocab.txt b/full_models/mqf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..578f51d7d5db7fc284f0f9da3ae62db51686407a --- /dev/null +++ b/full_models/mqf/vocab.txt @@ -0,0 +1,45 @@ +| +e +o +a +n +t +r +b +m +k +i +y +s +u +w +á +- +ò +ó +à +í +é +ù +è +ì +ú +0 +4 +1 +2 +l +5 +p +3 +6 +9 +7 +h +8 +d +j +c +' +g + diff --git a/full_models/mqj/D_100000.pth b/full_models/mqj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff1448ec24cf86f7741a2493b0ec28964164c2b0 --- /dev/null +++ b/full_models/mqj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c33721ef6bf09d505bc3459ac33cc0f2d0d5cfdb844773745f9223c93975513e +size 561078966 diff --git a/full_models/mqj/G_100000.pth b/full_models/mqj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f4dfa9991696e4dd9189da5357c588f8755b880 --- /dev/null +++ b/full_models/mqj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdc4e5bdf5a76c03b636ca738ed6c48dd9e13e17690037f1f03921517a33214 +size 436379757 diff --git a/full_models/mqj/config.json b/full_models/mqj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mqj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mqj/vocab.txt b/full_models/mqj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b34cbbfa2f76edac1684e0eef5ffa3586907251c --- /dev/null +++ b/full_models/mqj/vocab.txt @@ -0,0 +1,37 @@ +j +- +d +z +8 +p + +l +2 +5 +h +m +n +s +1 +6 +e +y +7 +4 +3 +k +f +t +r +i +' +a +_ +b +w +u +o +9 +c +0 +g diff --git a/full_models/mqn/D_100000.pth b/full_models/mqn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8bcdc3399a56bff022ee34cdc62dbc5f6ac978f2 --- /dev/null +++ b/full_models/mqn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2365e85ea9a67110f1c2f81eafcf0e476c67f05df5f9efc03354e875e753cbe +size 561078743 diff --git a/full_models/mqn/G_100000.pth b/full_models/mqn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3aac55d287d731174ce68fd43b8203de5366be77 --- /dev/null +++ b/full_models/mqn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d067dbadac5e46cbd60361b13d532b5ea9e0787fb2462a82eee1d2438c99efe +size 436364303 diff --git a/full_models/mqn/config.json b/full_models/mqn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mqn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mqn/vocab.txt b/full_models/mqn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc79b1b27f8ec3ff8cdb56da171761f68d7c7c29 --- /dev/null +++ b/full_models/mqn/vocab.txt @@ -0,0 +1,31 @@ +1 +3 +u +k +t +s +a +o +d +b +p +h +9 +g +c +j +r + +m +e +_ +z +l +f +i +- +n +y +' +4 +w diff --git a/full_models/mrw/D_100000.pth b/full_models/mrw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..627103afa572514af6420903c9a2fc5119dc8c38 --- /dev/null +++ b/full_models/mrw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa0ba5187542f74c957273b66584d92b260a8aeeaf0702c0eed9449e76b60a92 +size 561078737 diff --git a/full_models/mrw/G_100000.pth b/full_models/mrw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..383c3dfddb73c9199a85a13632b7d37ea6385bbc --- /dev/null +++ b/full_models/mrw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181e8d5c191a8a31b5dfc3f9b922c01a05415eb965588e7eb58d918c2e0069ae +size 436342195 diff --git a/full_models/mrw/config.json b/full_models/mrw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mrw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mrw/vocab.txt b/full_models/mrw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e59c4021abca9b1769841f24b131be6528421c29 --- /dev/null +++ b/full_models/mrw/vocab.txt @@ -0,0 +1,22 @@ +a +| +n +o +i +k +s +g +e +m +y +t +p +r +l +d +b +w +h +' +- + diff --git a/full_models/msy/D_100000.pth b/full_models/msy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b1b2e4f7e731e244460b92ff257948be67ad1b9 --- /dev/null +++ b/full_models/msy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4b543fd68d0dec6e47b408adbf06f9e2a375ac38ca423a0fa671369d6a0c4c +size 561078340 diff --git a/full_models/msy/G_100000.pth b/full_models/msy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b02970420ccdef9647078d28efa21bb0a023fa9 --- /dev/null +++ b/full_models/msy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc302a1807728de5e2de23e75b7524680784eee278b740b8be48fb9c65a063bc +size 436378157 diff --git a/full_models/msy/config.json b/full_models/msy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/msy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/msy/vocab.txt b/full_models/msy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..67432a1210a438b7b2a03c8d224f23985ed8c280 --- /dev/null +++ b/full_models/msy/vocab.txt @@ -0,0 +1,38 @@ +a +| +i +g +m +ɨ +r +n +e +h +z +u +k +b +o +t +v +d +s +p +f +l +j +0 +w +1 +2 +7 +4 +' +3 +y +5 +6 +9 +8 +- + diff --git a/full_models/mtd/D_100000.pth b/full_models/mtd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..be052c8ccdea807c33b52a532b6fb92495e5556c --- /dev/null +++ b/full_models/mtd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb554f726ada30ef77e8fb2e0d1b7017ac0aab954efb59ee0410efc7344cb19e +size 561076080 diff --git a/full_models/mtd/G_100000.pth b/full_models/mtd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bcf9c9a0767925de64bc5099af1bdca1e8fbad58 --- /dev/null +++ b/full_models/mtd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac2bae8336f3bdfa8c140107e22d603e8409a4a3367478c82cc9984834dfe03 +size 436329509 diff --git a/full_models/mtd/config.json b/full_models/mtd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mtd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mtd/vocab.txt b/full_models/mtd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bc01ec9c31893d8fa9348daeab9bdad7c295f2d6 --- /dev/null +++ b/full_models/mtd/vocab.txt @@ -0,0 +1,25 @@ +m +a +b +_ +- +t +r +y +c +i +o +s +g +p +h +ꞌ +d +l +j +e + +w +n +k +u diff --git a/full_models/mtj/D_100000.pth b/full_models/mtj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1abba96c7466371297ce734a0d909e27b4ca2432 --- /dev/null +++ b/full_models/mtj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41978967b75fc604eda1dfac59645eb852d1a16c1f20009aa2dcae55fdb1ce66 +size 561078607 diff --git a/full_models/mtj/G_100000.pth b/full_models/mtj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ef03b2a0047314c1f41a04fd536b5cbc7f1d82e --- /dev/null +++ b/full_models/mtj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5727ee016afc197a58a28464a5c791fe3755c32891a407688c66bc02bee56d8 +size 436364340 diff --git a/full_models/mtj/config.json b/full_models/mtj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mtj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mtj/vocab.txt b/full_models/mtj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..caefe28c5087556a55982cabdbeda533ba799ffc --- /dev/null +++ b/full_models/mtj/vocab.txt @@ -0,0 +1,32 @@ +o +e +y +j +k +h +t +r +0 +2 +f +n +s +i +' +z +g +u +d +4 +- +1 +c +a +b +l +m + +_ +w +6 +p diff --git a/full_models/mto/D_100000.pth b/full_models/mto/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a39ab3c0844206aeaf3a7d970817bd06e6eb6d4a --- /dev/null +++ b/full_models/mto/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a013c7fc44fd99c81b290e22091d4a4345398fd19b232f347b8d53cf3da923 +size 561076185 diff --git a/full_models/mto/G_100000.pth b/full_models/mto/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eed4e710a69fead90083582d787f07f868016112 --- /dev/null +++ b/full_models/mto/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec0f6271499720dbb398e8069fcbe6f3d87f60feaa522000491518e35b198d1 +size 436364880 diff --git a/full_models/mto/config.json b/full_models/mto/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mto/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mto/vocab.txt b/full_models/mto/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3bd4c316aa4d4619dc0c34072691894aed7398d2 --- /dev/null +++ b/full_models/mto/vocab.txt @@ -0,0 +1,40 @@ +l +r +z +4 +e +i +q +h +ú +í +y +v +c +ó +_ +9 +0 +w +ñ +' +t +n + +s +o +u +k +p +d +̱ +f +a +x +é +b +j +m +1 +g +á diff --git a/full_models/muh/D_100000.pth b/full_models/muh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e153dee8d3c9acc61c06925f5bba901c1e34fc9f --- /dev/null +++ b/full_models/muh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc2bbc85c2bf5b78b71aa0a4d76363e4386a90f6ad28d6251172866338f6642 +size 561076196 diff --git a/full_models/muh/G_100000.pth b/full_models/muh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d6ceac8622f346001c3e3bfdb6fdc61bb0bc5e7c --- /dev/null +++ b/full_models/muh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:868e2f6b431fd894abcd5e6f4e9d5246d0b6ad6477e1bb9c8a588be0e99ac87c +size 436346561 diff --git a/full_models/muh/config.json b/full_models/muh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/muh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/muh/vocab.txt b/full_models/muh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d9651d4c3a68b025b55336a49b521b9805f87dde --- /dev/null +++ b/full_models/muh/vocab.txt @@ -0,0 +1,32 @@ +| +a +e +ü +n +k +g +i +r +t +m +b +d +w +l +y +u +f +p +o +ï +s +h +- +z +ö +ʼ +c +j +' +v + diff --git a/full_models/mup/D_100000.pth b/full_models/mup/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..42c8191d98a8574db7c340c8a773150065f65593 --- /dev/null +++ b/full_models/mup/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c346a2517d7e6559afdad88e46ab8eed499ed77938070cbe0fd4b7c81efd676 +size 561079398 diff --git a/full_models/mup/G_100000.pth b/full_models/mup/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..199a8e3e75db2c8827069f3091424296a6a24482 --- /dev/null +++ b/full_models/mup/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c265b2e1ac7620f9b67f0ad411944c6e1121a683cfa99ad77e4d89008cc9a12 +size 436426293 diff --git a/full_models/mup/config.json b/full_models/mup/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mup/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mup/vocab.txt b/full_models/mup/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e12bef0c552156dc35c13c5b40e53ed89ec25416 --- /dev/null +++ b/full_models/mup/vocab.txt @@ -0,0 +1,57 @@ + +अ +ऊ +ढ +ब +द +- +ई +ट +ा +उ +ज +ओ +फ +झ +इ +ठ +ञ +ो +ु +़ +ः +ऐ +स +म +ण +ं +ग +ध +_ +प +र +थ +े +ळ +व +ष +भ +् +य +त +' +छ +ह +‍ +क +ू +न +घ +ल +च +ए +आ +ी +ि +ख +ड diff --git a/full_models/mur/D_100000.pth b/full_models/mur/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5c8ad8d91b08fa5e3e0f49a84c84fdfc88185a85 --- /dev/null +++ b/full_models/mur/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe7a0d743d504741ff1c10956ab34650efbb264e2c24fb6b05c9ab659540545 +size 561078637 diff --git a/full_models/mur/G_100000.pth b/full_models/mur/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..51aa7cb17ea508c3dee164cf567469f850fc8d5c --- /dev/null +++ b/full_models/mur/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aab9a1b095cbb42b2799843b8bb3e6f932d5b7a252a1878c5557b68a1b9d0df8 +size 436373461 diff --git a/full_models/mur/config.json b/full_models/mur/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mur/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mur/vocab.txt b/full_models/mur/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1f3e11e1167d2d1edd388297a24b059df570d66c --- /dev/null +++ b/full_models/mur/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +n +o +e +k +ɔ +t +l +u +ɛ +g +c +r +z +y +m +ŋ +b +d +w +j +s +v +p +ã +á +ḏ +ṯ +0 +1 +2 +5 +4 + diff --git a/full_models/muv/D_100000.pth b/full_models/muv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d128de5477e825e8461b62a8c7dcee26f208899b --- /dev/null +++ b/full_models/muv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4a0675b086d6c17e71426f3f4753345952b82291652a8b7d9e8346e9663f27 +size 561078875 diff --git a/full_models/muv/G_100000.pth b/full_models/muv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7119dfe334f0839a6faa9560bb043ff4f6fb9c54 --- /dev/null +++ b/full_models/muv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6388f7ca4ae9473f519242507cde487b23d25a50d63f76c88e92eb0c7373f246 +size 436400670 diff --git a/full_models/muv/config.json b/full_models/muv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/muv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/muv/vocab.txt b/full_models/muv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..28ba02f77f186fe8afe97e8a065e6cc307432cb5 --- /dev/null +++ b/full_models/muv/vocab.txt @@ -0,0 +1,47 @@ +ഒ +് +അ +ട +ണ +ര +ൂ + +ള +ോ +ഏ +ല +ച +ീ +റ +ആ +4 +എ +െ +ം +വ +ഇ +ക +ഊ +യ +3 +പ +' +ർ +6 +ഞ +ഉ +ൊ +ങ +ഓ +േ +ന +0 +ു +ശ +ഈ +ാ +ി +മ +ത +_ +ൻ diff --git a/full_models/muy/D_100000.pth b/full_models/muy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c5bd24c8fd24a1ecbd08127ed4df44cbcf0b9f36 --- /dev/null +++ b/full_models/muy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d937faadbc60ca0b22aaa5aae1e5fb79635ebc0356b3cc8034b89169b2d7eba +size 561078637 diff --git a/full_models/muy/G_100000.pth b/full_models/muy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c6330dcf67e4063bda48e5e6c508ab4b11abae2 --- /dev/null +++ b/full_models/muy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b657b574cb62bb93e75a3a3a91e2860faa148244a09c700172db64d8a512ff70 +size 436401486 diff --git a/full_models/muy/config.json b/full_models/muy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/muy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/muy/vocab.txt b/full_models/muy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..63a9af8de00ad573058284713b61280833ecc635 --- /dev/null +++ b/full_models/muy/vocab.txt @@ -0,0 +1,48 @@ +f +è +ə +d +̂ +ì +k +e +é +l +o +à +ù +̀ +_ +j + +z +t +ɓ +î +- +ê +g +ô +́ +a +h +y +í +s +ŋ +ò +á +c +ɗ +i +m +r +ʉ +w +b +u +â +p +n +ú +v diff --git a/full_models/mvp/D_100000.pth b/full_models/mvp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1869f785d62c85744d6f0e923182e093366881f1 --- /dev/null +++ b/full_models/mvp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32cc775ee17ffe3a9e9567e0739b131ec29ac7a99c5b88bc0a39ac247f0a3b0 +size 561078986 diff --git a/full_models/mvp/G_100000.pth b/full_models/mvp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ac1072e8aed0d4f525d1050e2942754369c8ff4 --- /dev/null +++ b/full_models/mvp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c58ba0e88581b4cf697bb789b3163d4b5344af6d63cfd6fee7dde6fed3b663b0 +size 436357932 diff --git a/full_models/mvp/config.json b/full_models/mvp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mvp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mvp/vocab.txt b/full_models/mvp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..de90a2d717686b944f0cf4183fbb7b27cc9bb607 --- /dev/null +++ b/full_models/mvp/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +i +o +t +u +m +l +k +g +s +e +p +' +r +d +b +j +h +- +w +c +y +f +z +q + diff --git a/full_models/mwq/D_100000.pth b/full_models/mwq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b4757ec62319b6631150ba206dcd49e495b2f1c5 --- /dev/null +++ b/full_models/mwq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33da0f0ab5f1c324931eab7aacb98702d40979d82104afd08e6c94aa2ade7e9e +size 561078632 diff --git a/full_models/mwq/G_100000.pth b/full_models/mwq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cf5b4a610fe24cbeee2f4b828cef4fc8f65f61de --- /dev/null +++ b/full_models/mwq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ead01870c1d7c39ebc7c98f672dc05293aab89dd08dd476eafff9e0a4fb9f78 +size 436392021 diff --git a/full_models/mwq/config.json b/full_models/mwq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mwq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mwq/vocab.txt b/full_models/mwq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..070b4fecc4b4fd8adc432bf930ea33bfc5c34045 --- /dev/null +++ b/full_models/mwq/vocab.txt @@ -0,0 +1,44 @@ +| +a +i +n +h +k +u +g +c +m +e +t +w +p +ä +s +l +' +ü +b +o +v +y +d +z +r +j +- +f +x +è +é +ë +á +0 +6 +ô +4 +î +ç +1 +õ +q + diff --git a/full_models/mwv/D_100000.pth b/full_models/mwv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..191a1a222aab94625ffdb2177eff86c3a95648fd --- /dev/null +++ b/full_models/mwv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a083dcbba6d7a0752f51c1c9d557db6ec2344732ecd2c904b45bda5dfdd99e +size 561078890 diff --git a/full_models/mwv/G_100000.pth b/full_models/mwv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..44b1c1c0df0b92e9022de9d1540dd032c9853c39 --- /dev/null +++ b/full_models/mwv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:525c280ab1e386807dce36f8ef4e70ee7826c28a733c67a8d003982a09d74493 +size 436366392 diff --git a/full_models/mwv/config.json b/full_models/mwv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mwv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mwv/vocab.txt b/full_models/mwv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6c647834d1da41c72efe178541c3a6f515cd4233 --- /dev/null +++ b/full_models/mwv/vocab.txt @@ -0,0 +1,31 @@ +a +| +i +u +n +e +k +t +s +m +g +l +b +p +r +o +d +y +j +h +c +' +- +f +v +w +z +0 +4 +1 + diff --git a/full_models/mxb/D_100000.pth b/full_models/mxb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9ee06036d9a88fd6e2e556530f17d8d00740f621 --- /dev/null +++ b/full_models/mxb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d7a4a4bb0d289ac0b3d37f6545a40a8bfae4951e0ec8d6f95735dedc2a1663 +size 561078767 diff --git a/full_models/mxb/G_100000.pth b/full_models/mxb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af445f31f69c63625c6fc10bd0020bf7d55399fe --- /dev/null +++ b/full_models/mxb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3306969c69e1bd49a85762bd3de2a74b55ec046a6eca5cd48f9389cf8070e932 +size 436399397 diff --git a/full_models/mxb/config.json b/full_models/mxb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mxb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mxb/vocab.txt b/full_models/mxb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8a548d8ea4cbe751d7195fcdbc6db9d7bb9a8984 --- /dev/null +++ b/full_models/mxb/vocab.txt @@ -0,0 +1,47 @@ +ñ +2 +r +e +k +̱ +ú +y +8 +é +0 +h +5 +s +' +_ +- +t +4 + +á +d +1 +q +i +6 +p +z +3 +í +b +l +9 +v +j +o +g +c +7 +u +a +f +x +m +ü +ó +n diff --git a/full_models/mxq/D_100000.pth b/full_models/mxq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c770da300011a009c541ca6b603764cc0012f973 --- /dev/null +++ b/full_models/mxq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39040a28ed16b4b774fbbcb798c1cfb0532f1468df60db012f8f39fb63a2dd4a +size 561078581 diff --git a/full_models/mxq/G_100000.pth b/full_models/mxq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ead36f88f0124217685f1a742f585d21b81f0512 --- /dev/null +++ b/full_models/mxq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4783e6130f5f6585e56cca20088b42a36844bbc0138349350d0c90559566c810 +size 436373666 diff --git a/full_models/mxq/config.json b/full_models/mxq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mxq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mxq/vocab.txt b/full_models/mxq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7089c0230198a83dfa07e07259f7d1fe538f28c4 --- /dev/null +++ b/full_models/mxq/vocab.txt @@ -0,0 +1,36 @@ +s +x +á +p +b +y +ó +w +i +e +́ +_ +ʉ +é +f + +̱ +— +u +z +m +r +o +d +t +k +a +í +l +' +n +ú +j +ñ +v +g diff --git a/full_models/mxt/D_100000.pth b/full_models/mxt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f0080f3a0941c342d14c5a25597acde391679347 --- /dev/null +++ b/full_models/mxt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b0766d895a0e245c9a88c0fed8d3a43af56cd5b95abd341953f74f4d5c10b1 +size 561078637 diff --git a/full_models/mxt/G_100000.pth b/full_models/mxt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3a6c0ee6daa2c0fb05132543e8fa6ba2b4d0367 --- /dev/null +++ b/full_models/mxt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc96a36973fc59772ef4e68fd8658ccd7ca972434a3e7df811d53ca4722db04 +size 436376884 diff --git a/full_models/mxt/config.json b/full_models/mxt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mxt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mxt/vocab.txt b/full_models/mxt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ebef750268b48c019937b89f7dfe52d463dcb209 --- /dev/null +++ b/full_models/mxt/vocab.txt @@ -0,0 +1,37 @@ +i +q +ó +h +̱ +r +k +j +é +f +c +s +í +x +ṉ +z +ɨ +l +v +b +n +p +a + +u +ñ +o +m +́ +e +t +ú +d +_ +g +á +y diff --git a/full_models/mxv/D_100000.pth b/full_models/mxv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e54f4a1ede2c5484da1b9cfbc0b3832ab8281325 --- /dev/null +++ b/full_models/mxv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04a03e62695628e4bb4038edd3f63661363b1e36b2d0ee9dd2408abb920af0b +size 561078623 diff --git a/full_models/mxv/G_100000.pth b/full_models/mxv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e65095cd54ff397793bbf9aea0b28cc56407f10e --- /dev/null +++ b/full_models/mxv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fbd21a46c4a2b9ee7fda0fc504770702deea1eb4d3eac0611c1d1bf06f27738 +size 436398783 diff --git a/full_models/mxv/config.json b/full_models/mxv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mxv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mxv/vocab.txt b/full_models/mxv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ae29440ff935b04813921644f03bdf9d494a22f1 --- /dev/null +++ b/full_models/mxv/vocab.txt @@ -0,0 +1,47 @@ +h +e +ò +o +v +l +u +j +s +ö +q +k +ù +é +f +à +g +p +_ +ï +í +ì +â + +è +r +̱ +ꞌ +t +ñ +á +î +ë +ü +d +n +ó +a +ú +x +b +m +ä +c +z +i +y diff --git a/full_models/mya/D_100000.pth b/full_models/mya/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f03c3eb29f075d493c6f3187bc83816af1027697 --- /dev/null +++ b/full_models/mya/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4d7245ceae433b4ce49f1b137f8dd4753d36e9e70732a688443eb0796b68fd +size 561078759 diff --git a/full_models/mya/G_100000.pth b/full_models/mya/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..106bd21cf1692baf9fff062d863b6c5258cd7723 --- /dev/null +++ b/full_models/mya/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ab311b552f6e65d66004194005309b44a9ce6e37690322d190c0cefeca9f64 +size 436426871 diff --git a/full_models/mya/config.json b/full_models/mya/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mya/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mya/vocab.txt b/full_models/mya/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..bb81ac28f3652206d1a38e5b7a1c9f727922fbcc --- /dev/null +++ b/full_models/mya/vocab.txt @@ -0,0 +1,57 @@ +် +ာ +ု +ိ +း +ေ +သ +က +င +တ +့ +မ +ြ +ည +ရ +အ +န +လ +ှ +ပ +စ +ခ +ျ +ူ +ွ +ါ +ထ +ဖ +ံ +ယ +ဆ +ီ +ဲ +ဟ +ဘ +ဝ +္ +ဉ +ဤ +ဇ +ဒ +ဂ +ဦ +ဏ +ဗ +ဓ +ဧ +ဥ +ဩ +ဌ +ဋ +' +ဣ +ဍ +ဿ +ဈ + diff --git a/full_models/myb/D_100000.pth b/full_models/myb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa93e610a9bdfb17309d9437031247801747c5cc --- /dev/null +++ b/full_models/myb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09a521207b66cff4f056ec13a36ff0f3c067485b8657e097bff1a15dec5a07b +size 561078961 diff --git a/full_models/myb/G_100000.pth b/full_models/myb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..13c4840ba35101fc260eb1de5944b142bedbac86 --- /dev/null +++ b/full_models/myb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f272d22723ac6c0cb0bae7437dfd9605a9f9b9a081b7b584adc0230f4d557d23 +size 436386588 diff --git a/full_models/myb/config.json b/full_models/myb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myb/vocab.txt b/full_models/myb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5f7a63374a42522a19a9e02804c1ffc172f18dd2 --- /dev/null +++ b/full_models/myb/vocab.txt @@ -0,0 +1,40 @@ +| +a +n +k +ï +t +d +e +o +g +l +i +m +r +ø +j +u +b +s +' +h +y +ð +w +þ +î +õ +ã +p +é +ë +à +á +ü +ò +- +ó +ú +ù + diff --git a/full_models/myk/D_100000.pth b/full_models/myk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4f5c069d1b7b3b91c320cfae8110e38fd5efd6b --- /dev/null +++ b/full_models/myk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1482d6f351d6645e0d90c387961d81f3e49c18964043ae29fa0be2c8515ee9 +size 561078589 diff --git a/full_models/myk/G_100000.pth b/full_models/myk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..da4e68598f0556c3a09f8dd93636cbc0fa6d7a16 --- /dev/null +++ b/full_models/myk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd0e0ceef9eb0cd94436977dd8053e5c99c9e91eca4ef54b38aec6db173626d +size 436396721 diff --git a/full_models/myk/config.json b/full_models/myk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myk/vocab.txt b/full_models/myk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e52349a6531dccdabdf08f6355be668301c2859b --- /dev/null +++ b/full_models/myk/vocab.txt @@ -0,0 +1,46 @@ +| +a +i +n +e +ɛ +u +w +y +k +p +o +g +l +b +r +m +s +ɔ +h +t +ɲ +d +f +ᴐ +ŋ +ʼ +j +c +' +z +x +` +è +à +v +á +ù +- +ì +í +é +ò +̀ +́ + diff --git a/full_models/myl/D_100000.pth b/full_models/myl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6dad609380222aed6c6d2467ea6ef880c5b2c35e --- /dev/null +++ b/full_models/myl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4b9ccb8b6ae8d3f3ab1c6a494fc241d75b4c5f1ca8709c832ac6e20a330d04 +size 561076020 diff --git a/full_models/myl/G_100000.pth b/full_models/myl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d8d7830b58f5879aaacaef9cf2cdbf5254fb893a --- /dev/null +++ b/full_models/myl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2982861e01251f600556f5418ff3491e9ddf531a2b1e304d73951b122b7c29 +size 436335957 diff --git a/full_models/myl/config.json b/full_models/myl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myl/vocab.txt b/full_models/myl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..47619f591cf99897b5fc63a95bb992d8691fe348 --- /dev/null +++ b/full_models/myl/vocab.txt @@ -0,0 +1,28 @@ +k +b +d +– +n +t +c +z +h +j +y +u +i +m +l +p +g +e +' +- +o +a +_ +w +s + +r +f diff --git a/full_models/myv/D_100000.pth b/full_models/myv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8f3031deac3f3d7d8ba6f59869ac6c204b71beb0 --- /dev/null +++ b/full_models/myv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d89ea7c29f27a2b405552de32f8b5264a87f69898faaad076a95587d17c14116 +size 561079016 diff --git a/full_models/myv/G_100000.pth b/full_models/myv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f04625fa15105e18128625b3ef96ca6776f1af27 --- /dev/null +++ b/full_models/myv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55835a1c749e2c447fa29da39dbaed1432f454c072dd37acaed67563dd4053e0 +size 436377416 diff --git a/full_models/myv/config.json b/full_models/myv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myv/vocab.txt b/full_models/myv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9a01a8dbd1388544108b4a9bb8a5d410537d6de5 --- /dev/null +++ b/full_models/myv/vocab.txt @@ -0,0 +1,36 @@ + +ш +м +ц +ф +т +_ +ы +к +ж +р +о +ё +ч +е +и +у +с +ь +э +а +в +н +з +л +й +г +щ +я +п +ю +д +- +х +б +– diff --git a/full_models/myx/D_100000.pth b/full_models/myx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ea4692e4c72cf3a1cedde534e1e7d0b49ecdf5d --- /dev/null +++ b/full_models/myx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c9f073532444044cbd0fbd212e3f191d8370ec8e6f4550db7dd5dba06a6f80 +size 561078611 diff --git a/full_models/myx/G_100000.pth b/full_models/myx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0fada999658dbaa1f6c829ca1a40cf5476209b18 --- /dev/null +++ b/full_models/myx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354208f0a71a1f723a98aa6bb5c12210486c6d6da530e81a988320f3979fd960 +size 436364465 diff --git a/full_models/myx/config.json b/full_models/myx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myx/vocab.txt b/full_models/myx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a6713d28c4809cd81b4db2efdf92a4dab051a6d8 --- /dev/null +++ b/full_models/myx/vocab.txt @@ -0,0 +1,32 @@ +| +a +i +u +e +n +b +k +l +o +s +h +w +m +y +t +r +d +g +f +' +p +ŋ +j +z +v +- +0 +c +4 +1 + diff --git a/full_models/myy/D_100000.pth b/full_models/myy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..390ba3a3fc6b8d21adc7a21786732e2df7c526c8 --- /dev/null +++ b/full_models/myy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce8f54c1c2e16919d75f8e0a6819cb4929a87dbe8be7786675ff960429e5a0f +size 561078486 diff --git a/full_models/myy/G_100000.pth b/full_models/myy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..56f2178e0074cc8a04ac61a1a3c57a68b23a1d7a --- /dev/null +++ b/full_models/myy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa15b92a7a82371f5f916b6cfcebfacdeed51a60ba4afb8a135335c36b880e0 +size 436396624 diff --git a/full_models/myy/config.json b/full_models/myy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/myy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/myy/vocab.txt b/full_models/myy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..18088e4c21a4953747e65685d3fc0269d90be6fb --- /dev/null +++ b/full_models/myy/vocab.txt @@ -0,0 +1,46 @@ +̃ +g +b +õ +ñ +z +‍ +é +ʉ + +a +p +w +u +f +r +e +ũ +x +m +n +— +l +́ +ú +y +_ +ẽ +k +v +ó +t +q +s +' +ü +j +ã +h +d +o +c +i +ĩ +á +í diff --git a/full_models/mza/D_100000.pth b/full_models/mza/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c648cf1c6ba690d048634a404d9cde82226cda08 --- /dev/null +++ b/full_models/mza/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:625e46a3d30ec8d218d0b5664081b709d83a7fbd6bfce057ea53075a47ee9f00 +size 561078215 diff --git a/full_models/mza/G_100000.pth b/full_models/mza/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..750f7d2e412e926d755c54ccf62ae1c5bfcac636 --- /dev/null +++ b/full_models/mza/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfd14c11623b98f222c371cab2ad0cf35109ab95deb23c8bfe55bb9b1b4a471c +size 436405795 diff --git a/full_models/mza/config.json b/full_models/mza/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mza/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mza/vocab.txt b/full_models/mza/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cbf887d1e1f16200a085e18c9c20f068d7064f8d --- /dev/null +++ b/full_models/mza/vocab.txt @@ -0,0 +1,50 @@ +| +a +n +i +u +' +t +k +d +o +r +c +h +ñ +m +v +y +e +j +à +s +ù +ì +ā +ī +g +l +ü +̱ +x +ö +í +ū +p +á +ē +b +é +ú +ï +è +ä +ó +f +ō +z +ò +q +ë + diff --git a/full_models/mzi/D_100000.pth b/full_models/mzi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ca1b0f2c1546747ef8fa11c873893d52b3f4768 --- /dev/null +++ b/full_models/mzi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c08abcbc71029f01c6fa5f8fed3c8c77726c2975cc977afb22497188dcefb0 +size 561078591 diff --git a/full_models/mzi/G_100000.pth b/full_models/mzi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a6310bf305ccb56bd17ef2d7f2a0c84ef73da695 --- /dev/null +++ b/full_models/mzi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf431bcda10aacf6387c642e6f4ac348ad275b85a222dabcae792884b3cbb0b +size 436371374 diff --git a/full_models/mzi/config.json b/full_models/mzi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mzi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mzi/vocab.txt b/full_models/mzi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..78863efa3271812b63379a66a6d8b3d81ebd9dca --- /dev/null +++ b/full_models/mzi/vocab.txt @@ -0,0 +1,35 @@ +i +g +ó +a +ú +ñ +o +c +k +ń +̱ +h +y +ṉ +s +á +f +u +' +é +d +r +n +b +– +t +j +m +_ +p + +x +í +l +e diff --git a/full_models/mzj/D_100000.pth b/full_models/mzj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bc2499d2ca0c5a3cbf70cf8d98252d5950175a18 --- /dev/null +++ b/full_models/mzj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e74177de422f2efb4a3b4f6658a04cde02f52d9de14cd5d26c49cc90dafa06 +size 561076192 diff --git a/full_models/mzj/G_100000.pth b/full_models/mzj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..afa19437630fb242bf41a4030c638e1eb8b89e46 --- /dev/null +++ b/full_models/mzj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6c93c49f6dfd6f49f8429817a6b72e9c89c7d1ddc454eb29106433e55d3d1d8 +size 436348852 diff --git a/full_models/mzj/config.json b/full_models/mzj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mzj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mzj/vocab.txt b/full_models/mzj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ac71a218b34dab0e9f8da824357aea0445f388f --- /dev/null +++ b/full_models/mzj/vocab.txt @@ -0,0 +1,33 @@ +m +ɔ +o +l +s +t +i +ɛ +z +̀ +v +' +ǹ +d +a +h +à +w +́ +e +y +b +p +n +u +ǃ + +f +g +ɲ +k +j +_ diff --git a/full_models/mzk/D_100000.pth b/full_models/mzk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..94a56ca0cea818189824e6e16abd2db284ffacbb --- /dev/null +++ b/full_models/mzk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d103b1e6871794726021e3ac3c115dcc7ed8dfc4a34ac7700254c22e1699969d +size 561078739 diff --git a/full_models/mzk/G_100000.pth b/full_models/mzk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d077038bfd14762753745c2b2efd831ea81d6dda --- /dev/null +++ b/full_models/mzk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c450077879c59c477585bd94e7fc39a9fe45da385bcf009c70c05b83666ba0cb +size 436387411 diff --git a/full_models/mzk/config.json b/full_models/mzk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mzk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mzk/vocab.txt b/full_models/mzk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e08523a0ea98f8753e7598c1a39a1f25292c75d8 --- /dev/null +++ b/full_models/mzk/vocab.txt @@ -0,0 +1,41 @@ +| +h +e +n +a +l +b +i +o +u +d +é +à +m +s +g +k +t +j +r +w +- +ò +è +y +c +á +ú +p +v +ó +ì +f +í +ù +' +z +x +1 +2 + diff --git a/full_models/mzm/D_100000.pth b/full_models/mzm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af45a188f5091f6844e1a12dda4763010263754d --- /dev/null +++ b/full_models/mzm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed05166f347e0751f09811cd701ee11783b9742e5053d6fb9f6686dc47bcc49 +size 561078630 diff --git a/full_models/mzm/G_100000.pth b/full_models/mzm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b854b5f5b6ee57715ed82fcfaa1d96b0d750f3c --- /dev/null +++ b/full_models/mzm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77126588b97a1f5254a052d20fe8fbf6eca66c17fe005207a3a74575c9850ea5 +size 436421933 diff --git a/full_models/mzm/config.json b/full_models/mzm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mzm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mzm/vocab.txt b/full_models/mzm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2674ee8609ab651f8b6f82cf9e6ea9a06f3ef292 --- /dev/null +++ b/full_models/mzm/vocab.txt @@ -0,0 +1,57 @@ +| +a +n +ɔ +ɛ +g +i +u +k +ɓ +r +t +e +s +z +y +l +p +w +o +d +b +h +m +v +ã +̃ +j +ì +̀ +́ +à +á +ũ +f +í +è +ù +é +ú +ñ +ò +ǎ +ń +ó +' +õ +ĩ +ǹ +ṹ +ǐ +̌ +ŏ +̆ +ň +- + diff --git a/full_models/mzw/D_100000.pth b/full_models/mzw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3b90b993812d476ec6689388ecf6c2d9c63cc52f --- /dev/null +++ b/full_models/mzw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175387975f9319639c74dce542d35242e9f7a341bf10fdc0adb69358e6c0b817 +size 561079139 diff --git a/full_models/mzw/G_100000.pth b/full_models/mzw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82a5dc52a8151413b2165bedfca08ca16ba2c1c1 --- /dev/null +++ b/full_models/mzw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a1ce94623d2fc66aba822486a7441f1e8a49ac85e9a43cfa1154bf985f5cb18 +size 436385415 diff --git a/full_models/mzw/config.json b/full_models/mzw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/mzw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/mzw/vocab.txt b/full_models/mzw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..86edc5726e4e4867022de1c8f98c24fcdc76aa3a --- /dev/null +++ b/full_models/mzw/vocab.txt @@ -0,0 +1,40 @@ +g +c +ń +ó +ŋ +- +k +é +ú +r +b +m +ô +́ +p +o +_ +s +â +d +j +e +l +v +u +w +h +' +n +ɛ +t +y +6 +å +a +f + +i +á +ɔ diff --git a/full_models/nab/D_100000.pth b/full_models/nab/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0092def51a34292536993671062a58e750f34cc0 --- /dev/null +++ b/full_models/nab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c881e6f25f6a2ed2bdb514b9cb2adb95266ad97842cea1ede49516395716424b +size 561076163 diff --git a/full_models/nab/G_100000.pth b/full_models/nab/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d21a46bb6bea3371740c9212bdce962284b2f24c --- /dev/null +++ b/full_models/nab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8319af29bdaa79016fd4a6a7f0bfd323b6ff386f66b2237d7eebea453b7c9b +size 436367005 diff --git a/full_models/nab/config.json b/full_models/nab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nab/vocab.txt b/full_models/nab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbb7d753055de5a6c9108dc10883c8ca0af7ed3c --- /dev/null +++ b/full_models/nab/vocab.txt @@ -0,0 +1,41 @@ +v +' +6 +0 +k +u +j +i +ĩ +8 +7 +ẽ +̱ +m +e +a +w +— +2 +4 +f +t +ũ +s +õ +_ +y +n +l +r +1 +o +5 +3 +9 +x +h + +p +b +ã diff --git a/full_models/nag/D_100000.pth b/full_models/nag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6232115d1d456186bd54d949a439eb9f01d260d8 --- /dev/null +++ b/full_models/nag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f4e76e6ad42ef32bd32b5a8740d2ffae37543a38a7cbbf588c30e3b303b292 +size 561078894 diff --git a/full_models/nag/G_100000.pth b/full_models/nag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2c1c9c2b8044e5386decae777a75c470f3767c9 --- /dev/null +++ b/full_models/nag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f0deeb6f996fe0e057310acc176fdcdfb48b2a89dd0cc1b5fa48a6e0b71683 +size 436380264 diff --git a/full_models/nag/config.json b/full_models/nag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nag/vocab.txt b/full_models/nag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..97f09b778b38ba5eb2bf5ca0c2d62adab78c4593 --- /dev/null +++ b/full_models/nag/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +e +o +k +h +n +t +r +u +s +b +l +m +p +g +j +d +c +y +w +- +v +z +f +' +0 +x +4 +q +1 +5 +3 +2 +6 + diff --git a/full_models/nan/D_100000.pth b/full_models/nan/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..465703fe517761e85609c18c75efdf1bb22c3c30 --- /dev/null +++ b/full_models/nan/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e737daad6b0e2ebdacd0501141f7315cbbceb03a75357ec71447447fb5bd69a2 +size 561079001 diff --git a/full_models/nan/G_100000.pth b/full_models/nan/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7df86d16d8cfcfae5c7ce3367b8c168ce4d69aef --- /dev/null +++ b/full_models/nan/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f438a01baec513b4350d7562901aa9a2f5ad7b1333e45d8a544108a081dded +size 436405453 diff --git a/full_models/nan/config.json b/full_models/nan/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nan/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nan/vocab.txt b/full_models/nan/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dc6abee9ee61779de033b1d31807fc6da190c8f0 --- /dev/null +++ b/full_models/nan/vocab.txt @@ -0,0 +1,48 @@ +| +h +- +i +n +t +k +g +a +c +s +l +o +ê +̍ +e +â +ó +ō +p +ū +í +ā +á +u +ī +m +͘ +b +à +è +ò +ì +ô +ú +ù +î +ē +j +û +̄ +é +ǹ +̂ +ń +' +ḿ + diff --git a/full_models/nas/D_100000.pth b/full_models/nas/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd41d8edb95a11b216b8789b6ff2a500d1edf1ae --- /dev/null +++ b/full_models/nas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861ad8649b78a982846b5bcbe661bbbcd4ec7858b254bb1adc90d3059ce72b50 +size 561078613 diff --git a/full_models/nas/G_100000.pth b/full_models/nas/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9211b7ab06167939d629da412c316bf38c7509f8 --- /dev/null +++ b/full_models/nas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbb8d9503eac4283d5cb5db053eddac553a1bddbf50ee3b30c16adf838c94348 +size 436366785 diff --git a/full_models/nas/config.json b/full_models/nas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nas/vocab.txt b/full_models/nas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..683f87d8776d3c46f4299fc6025378bb4cb177cc --- /dev/null +++ b/full_models/nas/vocab.txt @@ -0,0 +1,33 @@ +a +| +n +o +i +e +' +k +u +t +r +g +m +p +d +- +v +b +s +j +l +0 +– +1 +6 +4 +2 +7 +8 +5 +3 +h + diff --git a/full_models/naw/D_100000.pth b/full_models/naw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..987983ce7a86b5f424388a8c404b9ef31253a14f --- /dev/null +++ b/full_models/naw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f392250be783037c149111a585367464b38e6f9701ada1df29de3e124539406a +size 561078875 diff --git a/full_models/naw/G_100000.pth b/full_models/naw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ef85250440c53f236e503b8f10c141e487223394 --- /dev/null +++ b/full_models/naw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d925537b138458660322b92b817c35a2b45faa2acd300387feed04ef3ce9d5cd +size 436366939 diff --git a/full_models/naw/config.json b/full_models/naw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/naw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/naw/vocab.txt b/full_models/naw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..42a21fd97f2d8d2c85c26d743fe2ae20d09d9cfc --- /dev/null +++ b/full_models/naw/vocab.txt @@ -0,0 +1,31 @@ +| +a +ɩ +n +ɛ +ʋ +m +k +i +b +ɔ +y +s +t +l +u +f +w +g +e +r +p +o +d +‐ +ŋ +h +' +á +́ + diff --git a/full_models/nca/D_100000.pth b/full_models/nca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f368b8f6f0b70eccf8b5748b0e69beba8b2d0a4 --- /dev/null +++ b/full_models/nca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55c260d69b49d4aabf4527b9201d932f8df3b69a893b55ae2725f4d02911aac7 +size 561078896 diff --git a/full_models/nca/G_100000.pth b/full_models/nca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9704a43e83a772918b3a63e3f1031b5da674e49e --- /dev/null +++ b/full_models/nca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02cd5a0e91ffaaac22c82c1d2ad9f5e72b5f9d75b4c18675410a00cb6515505e +size 436395691 diff --git a/full_models/nca/config.json b/full_models/nca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nca/vocab.txt b/full_models/nca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ad6ebebbe7fc441e5bb77314cfd293fb925d4828 --- /dev/null +++ b/full_models/nca/vocab.txt @@ -0,0 +1,44 @@ +q +g +o +i +f +v +1 +6 +8 +' +ú + +t +d +w +_ +u +n +a +ŋ +ó +j +2 +é +b +l +z +r +e +á +7 +m +3 +0 +y +4 +p +k +s +í +h +5 +9 +- diff --git a/full_models/nch/D_100000.pth b/full_models/nch/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..820a1b597b18aa2c107fcaeb2cf0ec387b81a7fa --- /dev/null +++ b/full_models/nch/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0738006d2a021ab149fbc7b1d557276388409cd5736f8f2a18d8507fcb3c17d3 +size 561078120 diff --git a/full_models/nch/G_100000.pth b/full_models/nch/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0fad83ab372c5288cb81a034d76c17bedc5c9c04 --- /dev/null +++ b/full_models/nch/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af95d8831afac3e38ca35164bb247a5f232d64739bcb82e71ecb8f784566b7d9 +size 436378196 diff --git a/full_models/nch/config.json b/full_models/nch/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nch/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nch/vocab.txt b/full_models/nch/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9f9c26c12e8e061b56b5ca8de35e6a8fc55c4757 --- /dev/null +++ b/full_models/nch/vocab.txt @@ -0,0 +1,38 @@ +a +| +i +t +u +n +c +e +o +h +m +q +l +j +s +p +y +r +x +z +í +d +ú +b +á +— +é +f +' +g +ó +v +0 +1 +2 +k +4 + diff --git a/full_models/ncj/D_100000.pth b/full_models/ncj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..03de398a5b03b8358b832678c7143f630597b53a --- /dev/null +++ b/full_models/ncj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239e27e453a08676994b202388ee7ae2f0256f12a3b64f2185268fa011e90dd4 +size 561078979 diff --git a/full_models/ncj/G_100000.pth b/full_models/ncj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..04fa4db5a1d0a2bceacc3a14ff520128b61c5ad6 --- /dev/null +++ b/full_models/ncj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620cb20479049f120bd57d6ba21aec13c27024d40975c0d5df12fad72f5f8a83 +size 436368838 diff --git a/full_models/ncj/config.json b/full_models/ncj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ncj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ncj/vocab.txt b/full_models/ncj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ccec9f5d3aac079ec6f55f027e9b787b6df4bf43 --- /dev/null +++ b/full_models/ncj/vocab.txt @@ -0,0 +1,33 @@ +| +i +a +n +u +t +h +o +e +c +l +q +m +s +y +p +x +d +z +j +r +ú +b +g +é +á +f +í +v +ó +k +ñ + diff --git a/full_models/ncl/D_100000.pth b/full_models/ncl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a872ad8d583c327897918e422571f0717fb6ca2 --- /dev/null +++ b/full_models/ncl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7853bb3b4823f04a4352bb1aa0ce6aafaf643351dd76fd34f8a431447694bac +size 561076182 diff --git a/full_models/ncl/G_100000.pth b/full_models/ncl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..115535152f2a82cbc2a140b123715448c2a929ae --- /dev/null +++ b/full_models/ncl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b2a4106f4fd8aa2add26bea0378e846a906b6738c384b0536749298593cca4 +size 436357956 diff --git a/full_models/ncl/config.json b/full_models/ncl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ncl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ncl/vocab.txt b/full_models/ncl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c660b0322f4fe3c11fc510a8c29df967ffbf8547 --- /dev/null +++ b/full_models/ncl/vocab.txt @@ -0,0 +1,37 @@ +ꞌ +h +l +v +n +o +m +g +f +z +0 +_ +ú +y +d +é +c +a +x +e +á +b +q +r +k + +p +u +2 +s +ó +j +í +t +i +— +ñ diff --git a/full_models/ncu/D_100000.pth b/full_models/ncu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0db97bbb4d83cf48dd595753dee1deb1e3b08565 --- /dev/null +++ b/full_models/ncu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c068605cc876aa82df6029bc57130991518edb49b3d578e264200595f7baaef7 +size 561076189 diff --git a/full_models/ncu/G_100000.pth b/full_models/ncu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..336594e3f490cae3facb2c5e27724306e2bb0fd8 --- /dev/null +++ b/full_models/ncu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d48ac5158a2ccb8d5eb80baaefc34b2a48a29bb46068be36b6deaf0cbaaa29 +size 436344356 diff --git a/full_models/ncu/config.json b/full_models/ncu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ncu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ncu/vocab.txt b/full_models/ncu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6af2fbca8eeed69100d5e8a3cbd373c3470a1fc7 --- /dev/null +++ b/full_models/ncu/vocab.txt @@ -0,0 +1,31 @@ +| +̱ +e +a +o +n +ɔ +m +y +k +b +s +r +i +ɛ +ŋ +w +- +u +t +f +p +g +l +d +ò +' +h +ʻ +ʼ + diff --git a/full_models/ndj/D_100000.pth b/full_models/ndj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bfd64181cacb0fe7dd554387c551081f3ac29341 --- /dev/null +++ b/full_models/ndj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b8dc254e3d3fcc6efc1c2a84e22f66cbc232d9a9d228a3d4a316833bfc5c84 +size 561078961 diff --git a/full_models/ndj/G_100000.pth b/full_models/ndj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e086676c06112aed1e4f6cf896d9bacd163826d --- /dev/null +++ b/full_models/ndj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2784d70a289e69add187ec710607c3d63f54965c08f249af5bc8ef8dd3ac037e +size 436356253 diff --git a/full_models/ndj/config.json b/full_models/ndj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ndj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ndj/vocab.txt b/full_models/ndj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fcf012654ebc52f1af6ea4321aaddf80a54be4a5 --- /dev/null +++ b/full_models/ndj/vocab.txt @@ -0,0 +1,27 @@ + +v +y +l +h +p +o +t +c +i +s +d +m +k +w +' +_ +b +r +z +f +g +u +a +e +n +j diff --git a/full_models/ndp/D_100000.pth b/full_models/ndp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d3c38a17a2cc72d3fa0c15f216a459ca86e84d74 --- /dev/null +++ b/full_models/ndp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec3712a09a856e0eb6403968f84056abffdc86d2928a9edd7d8d3398d14bdd53 +size 561110374 diff --git a/full_models/ndp/G_100000.pth b/full_models/ndp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3d5c42263d71705fa6361d2d03ad563d5e68c153 --- /dev/null +++ b/full_models/ndp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9246130d38dd1f2583282a124dffdebfa5c1d7f7e57ac0f3dbe5b412f46fcf5e +size 436592079 diff --git a/full_models/ndp/config.json b/full_models/ndp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ndp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ndp/vocab.txt b/full_models/ndp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..64b725a8caf41d814ce3b1e3e095ca2183ba9963 --- /dev/null +++ b/full_models/ndp/vocab.txt @@ -0,0 +1,26 @@ +| +i +a +o +e +n +k +u +r +m +d +b +' +t +y +l +s +z +g +w +p +h +v +f +- + diff --git a/full_models/ndv/D_100000.pth b/full_models/ndv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2389732bf5e6e838a0e12ac68ac8b2cab7c9406d --- /dev/null +++ b/full_models/ndv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:439c64dda971c2d16009dda6ae7baf03580ba792167dafc7072e49d5276861f2 +size 561079378 diff --git a/full_models/ndv/G_100000.pth b/full_models/ndv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92e61cf3a3f0a6e0f524bdac69e733aa1d5d7df5 --- /dev/null +++ b/full_models/ndv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ebee21688e481a47344516d550009d96600881df844c0ea6d53b2fc6d41750 +size 436378197 diff --git a/full_models/ndv/config.json b/full_models/ndv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ndv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ndv/vocab.txt b/full_models/ndv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..19433c0bc98fb38645ff7a5c3afd1c19effb60d4 --- /dev/null +++ b/full_models/ndv/vocab.txt @@ -0,0 +1,35 @@ +c +m +r +g +o +t +s +b +i +h +- +y +w +d + +í +u +ɗ +ɓ +é +_ +f +ŋ +ë +j +l +a +k +ˈ +n +e +p +ñ +ƴ +ú diff --git a/full_models/ndy/D_100000.pth b/full_models/ndy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3c62d32eb1b5d6b88ab4487caddd0f135b37f679 --- /dev/null +++ b/full_models/ndy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01f570136e18d7f42694cd982531ccb109abce694e62d22f190511210a2aaed +size 561078754 diff --git a/full_models/ndy/G_100000.pth b/full_models/ndy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c8ff6885437a937f423e5447fa817f8c0b8adc6 --- /dev/null +++ b/full_models/ndy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ea67f9c1bca0f1a109d792fa1eb0d0362227b99c33388ceeff36a93cd1dbc8 +size 436364163 diff --git a/full_models/ndy/config.json b/full_models/ndy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ndy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ndy/vocab.txt b/full_models/ndy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..249aaffc5c90c351556524a66017d3c9a55b75c1 --- /dev/null +++ b/full_models/ndy/vocab.txt @@ -0,0 +1,31 @@ +u +n +p +̱ +e +g +r + +t +_ +v +h +s +ɔ +b +w +l +ɗ +' +ə +i +y +a +k +f +d +j +o +m +ɓ +z diff --git a/full_models/ndz/D_100000.pth b/full_models/ndz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..34209d1c764639c0fa3089ea27a9e02fee863e60 --- /dev/null +++ b/full_models/ndz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd33eacaab77e5eb440f5b9cbc0605e2fa7711c03b854160825671b6a06add1 +size 561078637 diff --git a/full_models/ndz/G_100000.pth b/full_models/ndz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..794c7a2cebeb87846884d34bad5a2a2fdbe35b4a --- /dev/null +++ b/full_models/ndz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f025aeee6431a0f5e5c852becf44e9398b7dd7b1785266acfb88372a7184e59 +size 436410571 diff --git a/full_models/ndz/config.json b/full_models/ndz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ndz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ndz/vocab.txt b/full_models/ndz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c60362392a2f1d386e38a88459b8f7587cfa403a --- /dev/null +++ b/full_models/ndz/vocab.txt @@ -0,0 +1,52 @@ +| +n +í +d +b +t +a +ì +m +g +á +k +i +à +' +o +ó +e +ò +y +ù +u +j +â +è +l +c +ṛ +w +ú +é +v +z +- +p +î +s +û +ŋ +r +ô +ê +f +0 +1 +4 +2 +— +7 +8 +6 + diff --git a/full_models/neb/D_100000.pth b/full_models/neb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c80ebe6a1609c38f8aabf517c2d7363b1c1490b8 --- /dev/null +++ b/full_models/neb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f60441cf4bfcda2ee077d186836bd716c6a668e679f2cd1bdf1545765f621b +size 561078454 diff --git a/full_models/neb/G_100000.pth b/full_models/neb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..01c5d3b405d0d818ade193e47cf4191aa81cc675 --- /dev/null +++ b/full_models/neb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ddfbcb33bb7e6b1860c3f04f644d4610d0704c701670f14dbb94828b257c18 +size 436398916 diff --git a/full_models/neb/config.json b/full_models/neb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/neb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/neb/vocab.txt b/full_models/neb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2b9231d2400ea1869f1e5cd301aaec38907f6045 --- /dev/null +++ b/full_models/neb/vocab.txt @@ -0,0 +1,47 @@ +| +à +n +l +a +ɛ +e +i +k +g +w +á +b +̀ +' +o +ɔ +- +t +é +y +́ +p +ó +m +h +u +è +ò +s +z +d +í +ù +ɩ +ú +ʋ +̂ +f +ì +v +â +ê +î +ô +` + diff --git a/full_models/new/D_100000.pth b/full_models/new/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..33de94377b6704807401026c9347a96beecfd611 --- /dev/null +++ b/full_models/new/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a6eefa64c526f8aa3091562a7cd2a0ce3812a6d2642c0f7450e0a4435c86761 +size 561079002 diff --git a/full_models/new/G_100000.pth b/full_models/new/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f748622142107d96bbbb2e5a2d482649ed9430c1 --- /dev/null +++ b/full_models/new/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48750327fc8effe252cb583a0a6a0c169e04d7124e8b0d3a978159e7ba268f47 +size 436440716 diff --git a/full_models/new/config.json b/full_models/new/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/new/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/new/vocab.txt b/full_models/new/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9c398e18843828dfc2602545ef2213e7eaf9dc18 --- /dev/null +++ b/full_models/new/vocab.txt @@ -0,0 +1,64 @@ +क +स +२ +ो +ढ +े +म +छ +ँ +ठ +ट +ब +१ +ई +ज +ा +ओ +उ +थ +ञ +न +द +अ +ह +र +‍ +ए +ङ +ग +_ +ः +श +ै +० +' +ण +ख +६ +ू +् +ृ +व +झ +- +ं +य +प +फ +ऊ +भ +इ +ड +आ +ि +ध +ौ +च +ु +त +ी +ल + +ष +घ diff --git a/full_models/nfa/D_100000.pth b/full_models/nfa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d203868d9046df8d16f826671356fe7b687cd266 --- /dev/null +++ b/full_models/nfa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e028bb9286a28c941f4ac9f6756edaae1ac3ad38346bfd3ac05a4493133a3a3 +size 561076024 diff --git a/full_models/nfa/G_100000.pth b/full_models/nfa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed510aff172b57e8aa5a3def3a7bb66806276948 --- /dev/null +++ b/full_models/nfa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fab0dc20f519c58a3838e1a565f2d1ab6b68b4feba3a807391b0259737446f8 +size 436333624 diff --git a/full_models/nfa/config.json b/full_models/nfa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nfa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nfa/vocab.txt b/full_models/nfa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c5b61604d6890a1b24f0b5d3ec2c6e6d7dc5f3ec --- /dev/null +++ b/full_models/nfa/vocab.txt @@ -0,0 +1,27 @@ +c +t +p +_ + +- +e +i +g +' +y +k +r +d +m +s +j +w +n +u +f +l +b +è +h +a +o diff --git a/full_models/nfr/D_100000.pth b/full_models/nfr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57286ad02820e8fd4d1dab24e8817e2fbad0ac6b --- /dev/null +++ b/full_models/nfr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6f87f1869275b5a43235929e78e551edd06504651cf595eec03ef7ae9f5eacd +size 561078719 diff --git a/full_models/nfr/G_100000.pth b/full_models/nfr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d1bbb7f24c5b45141afb5728e23b57b6c9ab2eb1 --- /dev/null +++ b/full_models/nfr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07beed6b0b3f6a5f5c3067543ec314a390517ca61890780dd4d676d5623aa1e +size 436364583 diff --git a/full_models/nfr/config.json b/full_models/nfr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nfr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nfr/vocab.txt b/full_models/nfr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..423a4a73fc1853c1de091466b858a1c3b654cd7d --- /dev/null +++ b/full_models/nfr/vocab.txt @@ -0,0 +1,32 @@ +| +a +n +e +i +r +k +u +m +y +ɛ +l +p +o +ↄ +b +w +t +s +ŋ +g +h +f +j +d +c +' +z +v +- +2 + diff --git a/full_models/nga/D_100000.pth b/full_models/nga/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a5bc6f50513adb1a4fe9f84af50075bafeb56955 --- /dev/null +++ b/full_models/nga/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e72b6d1079b99f06103c639a7cefd4b5e0d50ce53a2e2b80b995ae79328286 +size 561078734 diff --git a/full_models/nga/G_100000.pth b/full_models/nga/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7957e0f738b3ba4703d76bc953401a53cc4ad7f2 --- /dev/null +++ b/full_models/nga/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ce9cd53f1498c14a1c823b16e4f067a5331e29fbbf04bc2babafb2cd2b4525 +size 436394401 diff --git a/full_models/nga/config.json b/full_models/nga/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nga/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nga/vocab.txt b/full_models/nga/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8d473afba58d1950a7555fc8f8a77fd7c755e065 --- /dev/null +++ b/full_models/nga/vocab.txt @@ -0,0 +1,44 @@ +u +y +à +̃ +̀ +w +d +́ +ĩ +a +l +ã +t +n +ũ +ɛ +á +ì +k +ú +o +g +' +s +f +é +ò +è +m +_ +r + +- +z +ɔ +ó +i +ù +í +v +h +p +b +e diff --git a/full_models/ngl/D_100000.pth b/full_models/ngl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..011d05bc19fac25170a56dc6b5f7bcb73274e038 --- /dev/null +++ b/full_models/ngl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c2979d31dd1fdfa02b5453321cf529f58de65872e1b78df596c31e54a809f1 +size 561078842 diff --git a/full_models/ngl/G_100000.pth b/full_models/ngl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b2be7ee2ae6b124909a0ec8d9701bcf27f02814 --- /dev/null +++ b/full_models/ngl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0953e5caa6348b2302eb9f18c83a5ff30d61b4bcf339af45d8b241a661f9a235 +size 436347222 diff --git a/full_models/ngl/config.json b/full_models/ngl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ngl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ngl/vocab.txt b/full_models/ngl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..964255be98e987923ce787ad730da5f79016fadc --- /dev/null +++ b/full_models/ngl/vocab.txt @@ -0,0 +1,23 @@ +l +h + +u +_ +- +t +p +y +r +s +i +m +o +c +v +n +a +e +k +' +w +f diff --git a/full_models/ngp/D_100000.pth b/full_models/ngp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d3f1bc5fc19464e3507c02aa854d6f0acfa0a49 --- /dev/null +++ b/full_models/ngp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c5e604fa8c248fc36e70872476f477023050e743338781ad575683ba884bfb +size 561078969 diff --git a/full_models/ngp/G_100000.pth b/full_models/ngp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f6bf99325b830974f9c56d2af5a4c5575397fa51 --- /dev/null +++ b/full_models/ngp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae9ff0dd611ca7a60ff98d82c21ee4d33fabcb76ee15b2184920cd4503f8f8c +size 436355528 diff --git a/full_models/ngp/config.json b/full_models/ngp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ngp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ngp/vocab.txt b/full_models/ngp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4a19940ee4e36d966d594d92ae7716a85d944e9d --- /dev/null +++ b/full_models/ngp/vocab.txt @@ -0,0 +1,27 @@ +' +v +r +b +t +k +u +w +_ +a + +y +m +d +g +l +j +h +z +o +i +c +p +f +e +s +n diff --git a/full_models/ngu/D_100000.pth b/full_models/ngu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..915f07bb4379c0ffc1dface84858ad1da3d003b4 --- /dev/null +++ b/full_models/ngu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006364e9e379c6ad71feda36f341175d5fca5992297756e151322e753c9818d3 +size 561076176 diff --git a/full_models/ngu/G_100000.pth b/full_models/ngu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..df452c59fda139e9a538176d16f492bafc0c94b8 --- /dev/null +++ b/full_models/ngu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb6753e27b1c7b39cfa855cfce4381c777fd092dc6c39fef47b309608daf3d5 +size 436355782 diff --git a/full_models/ngu/config.json b/full_models/ngu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ngu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ngu/vocab.txt b/full_models/ngu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c88b60d71baa31f310d92acee43c70147b2cd8e9 --- /dev/null +++ b/full_models/ngu/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +n +e +u +t +o +j +c +l +h +m +q +s +p +y +x +r +d +z +b +ú +á +í +g +ó +é +f +v +ñ +0 +1 +2 +k + diff --git a/full_models/nhe/D_100000.pth b/full_models/nhe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b922ea512686744f5afd77e7239760fe9e0ab265 --- /dev/null +++ b/full_models/nhe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f975844e0f5ba1697a76c1fea04ea995cdd434a75ae1e447075ceb7aa3350fe +size 561076678 diff --git a/full_models/nhe/G_100000.pth b/full_models/nhe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8152ea08005faa61c3bcbf044b46b5b8d9988c8a --- /dev/null +++ b/full_models/nhe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430407144551861c77f43377ccd97e6850e60baae41c1a3a80be7c74a4fd550e +size 436368942 diff --git a/full_models/nhe/config.json b/full_models/nhe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhe/vocab.txt b/full_models/nhe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..94da1bcd06156107324f14cc435c09f726be0f7c --- /dev/null +++ b/full_models/nhe/vocab.txt @@ -0,0 +1,34 @@ +a +| +i +t +u +n +e +l +c +o +h +q +j +m +p +s +y +x +r +' +z +d +- +b +f +g +v +0 +1 +2 +k +4 +3 + diff --git a/full_models/nhi/D_100000.pth b/full_models/nhi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e45aecd66f77658e0afce4bb5d0652e279db8ebb --- /dev/null +++ b/full_models/nhi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:310ce19f73ff613e2aa3a9e8be625e54d13870525288c685aa96701cfc17aca1 +size 561078707 diff --git a/full_models/nhi/G_100000.pth b/full_models/nhi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ee6df1e0b650c91a9edb591ccc7df782622fd94d --- /dev/null +++ b/full_models/nhi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fae3f991793db6554ca0a51f39700cfa3e982707bec3db188a418952319537a +size 436376093 diff --git a/full_models/nhi/config.json b/full_models/nhi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhi/vocab.txt b/full_models/nhi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..28158450ac4f7d8834c6db47d4c597e54c02cf07 --- /dev/null +++ b/full_models/nhi/vocab.txt @@ -0,0 +1,37 @@ +| +i +a +n +t +o +c +u +h +l +e +m +s +q +p +y +z +x +d +r +j +ú +í +— +b +é +g +v +f +ó +á +' +ñ +k +­ +- + diff --git a/full_models/nhu/D_100000.pth b/full_models/nhu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..90a3dc7a32a95fff02853365205cffb66f991fa0 --- /dev/null +++ b/full_models/nhu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa5083f777d6cd18f888195f65237414dc36805312e4abc0b7ce8992e156b2f +size 561078702 diff --git a/full_models/nhu/G_100000.pth b/full_models/nhu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..597dde9e93d95a88db6cf16cb75d74c187777dcb --- /dev/null +++ b/full_models/nhu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a77a20aab175ac8070ba9d349f143beb6168e64689455fdacb68748bc5121345 +size 436394532 diff --git a/full_models/nhu/config.json b/full_models/nhu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhu/vocab.txt b/full_models/nhu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..42bf9d226a30d3974f9d0bf43ca81bca1bd981d8 --- /dev/null +++ b/full_models/nhu/vocab.txt @@ -0,0 +1,45 @@ +| +e +ɛ +n +o +b +u +w +i +k +a +y +m +l +v +s +t +f +ŋ +g +d +j +c +ú +ó +' +ù +ô +̂ +̀ +h +́ +ì +î +ò +è +í +p +é +á +à +û +â +ê + diff --git a/full_models/nhw/D_100000.pth b/full_models/nhw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..25bcb49201deb6fa2a8440c9dc2161b69595f8c4 --- /dev/null +++ b/full_models/nhw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88c54d8654c38329d721414ae08884674ea40352b327a017e3d0562195d2cbb +size 561076208 diff --git a/full_models/nhw/G_100000.pth b/full_models/nhw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..51b896199f9a82bbabbcf787478468e054045e4e --- /dev/null +++ b/full_models/nhw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e846cd43560c5964c655e78233021a14898c147e3ad17f05bc5d97cc2efdc6 +size 436358339 diff --git a/full_models/nhw/config.json b/full_models/nhw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhw/vocab.txt b/full_models/nhw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e600ad22476dbebd27e05f504a005af0e28c0845 --- /dev/null +++ b/full_models/nhw/vocab.txt @@ -0,0 +1,37 @@ +a +| +i +t +u +n +c +l +e +o +h +m +q +s +p +j +y +r +x +z +í +d +ú +b +á +— +é +f +' +g +ó +v +0 +1 +2 +k + diff --git a/full_models/nhx/D_100000.pth b/full_models/nhx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff3168fe7eca530700f2574cf6a800a564cd27fa --- /dev/null +++ b/full_models/nhx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909a029332b923481a3d443c6d5789e4b64690f894f84c6f63f21b502a72fc55 +size 561078360 diff --git a/full_models/nhx/G_100000.pth b/full_models/nhx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8862e5fabcac7b745ff97b641b4fc3d84443ff55 --- /dev/null +++ b/full_models/nhx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087f5dc0effe7774531da2774c5f2de7465d761a2d01e0f4adaae033147ac1f9 +size 436378786 diff --git a/full_models/nhx/config.json b/full_models/nhx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhx/vocab.txt b/full_models/nhx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..738372418f2e8952f9d78437112c26310b420504 --- /dev/null +++ b/full_models/nhx/vocab.txt @@ -0,0 +1,39 @@ +| +i +a +̱ +n +e +j +k +o +t +m +y +w +s +l +' +á +p +g +c +h +d +r +u +x +z +ó +í +é +ú +‐ +b +f +— +v +q +ñ +3 + diff --git a/full_models/nhy/D_100000.pth b/full_models/nhy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8cb41f9bb655773f173788935f64538faeff147c --- /dev/null +++ b/full_models/nhy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e8279f6bd6e13c42581f6d6080048c5fa5e9178c6483030b3745cd3787805a +size 561078715 diff --git a/full_models/nhy/G_100000.pth b/full_models/nhy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a795d48365e9519cc350b45007e6516bb39c48ac --- /dev/null +++ b/full_models/nhy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890400d753e3b8c33e248327a2351618de18ec371bd4a8855dfb649b74743827 +size 436368963 diff --git a/full_models/nhy/config.json b/full_models/nhy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nhy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nhy/vocab.txt b/full_models/nhy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b7dad277da24749dd3c7746ae59401849668546b --- /dev/null +++ b/full_models/nhy/vocab.txt @@ -0,0 +1,34 @@ +z +o +h +x +u +ñ +j +t +f +p +y +r +é +c + +a +d +v +n +ó +e +b +á +ú +m +k +w +l +_ +í +i +g +s +q diff --git a/full_models/nia/D_100000.pth b/full_models/nia/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7d88babc528948a77da740812f26e784056bd0f7 --- /dev/null +++ b/full_models/nia/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b289de7dc80c436d055fde6247053d42068492db093b75c1f0258007cf23f392 +size 561079016 diff --git a/full_models/nia/G_100000.pth b/full_models/nia/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e7ec0e705912aa0f8377ecbd17a59d10e2e1800 --- /dev/null +++ b/full_models/nia/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7d8d490216e95dd98c6d38c7d3146c833bcc6f3633f26070919f1350e8af09 +size 436373593 diff --git a/full_models/nia/config.json b/full_models/nia/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nia/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nia/vocab.txt b/full_models/nia/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fea122991f9c4040bc67929cc1958fa5c30b4d7a --- /dev/null +++ b/full_models/nia/vocab.txt @@ -0,0 +1,34 @@ +| +a +i +ö +n +o +u +m +e +l +b +r +d +h +s +' +g +t +w +f +k +z +y +̃ +- +0 +p +j +2 +4 +6 +9 +1 + diff --git a/full_models/nij/D_100000.pth b/full_models/nij/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d8b74d1e7bcee79d3e64109f6d9b1e1a6545e5a2 --- /dev/null +++ b/full_models/nij/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb147e8200d947311e4cf200d52641ea425e16dc875d4f657dbb15b4ad87aa2 +size 561078893 diff --git a/full_models/nij/G_100000.pth b/full_models/nij/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23bc968153b317190336f595c007711485d6a212 --- /dev/null +++ b/full_models/nij/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80161923b82c87f0de4a0a443cea78d544f545beb6c8d109fbccced00c30085f +size 436373006 diff --git a/full_models/nij/config.json b/full_models/nij/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nij/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nij/vocab.txt b/full_models/nij/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3e29632c6238a140d530fbc804d3b7e028e646d1 --- /dev/null +++ b/full_models/nij/vocab.txt @@ -0,0 +1,34 @@ +a +| +n +e +t +i +h +k +u +m +o +l +r +g +s +p +b +j +d +w +y +- +c +' +0 +z +4 +7 +5 +1 +2 +6 +f + diff --git a/full_models/nim/D_100000.pth b/full_models/nim/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5a0160f0d24daae726e30415969bbd93a5d624ed --- /dev/null +++ b/full_models/nim/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a351fdc1c91d57dd179226ab066368edf1af8a404d7bf345dde362d2345571d +size 561078752 diff --git a/full_models/nim/G_100000.pth b/full_models/nim/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3b91a4f84b322de0da953cd57aa1ddd26d173fc9 --- /dev/null +++ b/full_models/nim/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8689c47bff1421d033327405a56461f431653f5520691ff7db6569a3037a1356 +size 436365936 diff --git a/full_models/nim/config.json b/full_models/nim/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nim/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nim/vocab.txt b/full_models/nim/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e66b07292c417d3ad357b6a20ccfac6631df41a0 --- /dev/null +++ b/full_models/nim/vocab.txt @@ -0,0 +1,31 @@ +a +| +u +n +i +ĩ +k +l +e +m +o +g +t +s +ũ +w +p +y +z +d +b +h +j +- +' +f +r +0 +2 +4 + diff --git a/full_models/nin/D_100000.pth b/full_models/nin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c897fce95929c148bcb191a1052b0dd2d34027dc --- /dev/null +++ b/full_models/nin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803bb8120f61d667781e5f412018007133d1749e96556214082e8542cb334c8b +size 561078849 diff --git a/full_models/nin/G_100000.pth b/full_models/nin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b2211a7e4c2b48798dc2ffb7b701f032633dfc4 --- /dev/null +++ b/full_models/nin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3162c7f5bb9642443ee143f50cfb0a907bbdf9aeea5c4bd091c5b2d80dc8da +size 436404846 diff --git a/full_models/nin/config.json b/full_models/nin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nin/vocab.txt b/full_models/nin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..10bda61bba4ce00d5397b57d5758d761c127613c --- /dev/null +++ b/full_models/nin/vocab.txt @@ -0,0 +1,48 @@ +a +_ +l +h +i +o +á +p +j +s +ù +b +k +g +v +à +y +̱ +ò +n +t +ě +u +î +ā +ú + +z +d +â +e +ɨ +û +é +- +' +ī +̀ +ǎ +ū +è +ì +m +í +r +c +f +w diff --git a/full_models/nko/D_100000.pth b/full_models/nko/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8410006444d4356c5768a15251a785e1d9667576 --- /dev/null +++ b/full_models/nko/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0787c6b3d58f810eb68eb1481c562e3c88b2e2954d6e3e3c4c9ee743a109598 +size 561079491 diff --git a/full_models/nko/G_100000.pth b/full_models/nko/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb8055fdcc78b17093fc8ba1e1674fff580c2d23 --- /dev/null +++ b/full_models/nko/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac25fd25e42afc5bbfea73f51f02e8eaaddcf588b4f8f4ec2860ba6da4dfefe +size 436379011 diff --git a/full_models/nko/config.json b/full_models/nko/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nko/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nko/vocab.txt b/full_models/nko/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc4d5e8b4418f4a441c395d3775e3b89599b5af0 --- /dev/null +++ b/full_models/nko/vocab.txt @@ -0,0 +1,36 @@ +y +p +n +á +ɔ +s +h +ŋ +é +o +í +a +- + +k +r +ɛ +ʋ +— +t +́ +m +ó +e +u +b +g +l +i +ɩ +' +_ +f +w +d +ú diff --git a/full_models/nlc/D_100000.pth b/full_models/nlc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4ed379f18546546bc1efe0cc792029dc575b19d9 --- /dev/null +++ b/full_models/nlc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853d6ac587cbfaf33ab3b5674b364f297f1d040428ab9d4a572d6e69b38d5623 +size 561078634 diff --git a/full_models/nlc/G_100000.pth b/full_models/nlc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b34f0261d4043af9a364407bcaec37a3489e8e8 --- /dev/null +++ b/full_models/nlc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc6ccbcdf7bcf3163aff6b9a42bfa893b51cd5b467bf908df9601bf43bb2522 +size 436369105 diff --git a/full_models/nlc/config.json b/full_models/nlc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nlc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nlc/vocab.txt b/full_models/nlc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3f39ab5b317ad060d700e1e27c7112f619bde4f2 --- /dev/null +++ b/full_models/nlc/vocab.txt @@ -0,0 +1,34 @@ +4 +e +` +l +o +n +p +f +m +2 +w +k +d +u +h +i +3 +0 +_ +y +c +a +z +j +t +' +s +b + +r +- +v +1 +g diff --git a/full_models/nld/D_100000.pth b/full_models/nld/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..25d4dcce9d65c12e24eae2f507d515fcc23704ac --- /dev/null +++ b/full_models/nld/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134d99fb55ce04610acd1eb86551c3a5f24f963c114ecd7831b48e733847834f +size 561110250 diff --git a/full_models/nld/G_100000.pth b/full_models/nld/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59fa1ebcfb235be172e27c2add9256166912b1bf --- /dev/null +++ b/full_models/nld/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e8bacbc262209493cba57f57bd758f7f3cd9b8973d63f2182d3a9c02cafdb4 +size 436625856 diff --git a/full_models/nld/config.json b/full_models/nld/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nld/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nld/vocab.txt b/full_models/nld/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..632977b9b1773234c5e84a81a34813456f89aac6 --- /dev/null +++ b/full_models/nld/vocab.txt @@ -0,0 +1,41 @@ +g +s +- +– +ó +i +_ +q +v +w +j +h +ü +y +è +m +z +ï +b +é +n +u + +k +l +ë +í +o +p +c +á +r +a +f +ä +d +ú +' +t +x +e diff --git a/full_models/nlg/D_100000.pth b/full_models/nlg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f30eccb61bedaf4faeae57a6466176d7dc71be6c --- /dev/null +++ b/full_models/nlg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf30c7f8c70a97ac46e96180155a256b4181b760507806a30ab319b5cdd9eead +size 561078842 diff --git a/full_models/nlg/G_100000.pth b/full_models/nlg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c80697e689a1a8b022adc22a9e0b4f16dfd303bb --- /dev/null +++ b/full_models/nlg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61de574dfb83e6fbae1a82c390d4187e2b386a4fded38a437351b028064c0ca3 +size 436362241 diff --git a/full_models/nlg/config.json b/full_models/nlg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nlg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nlg/vocab.txt b/full_models/nlg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..45855c3d70d8438d3d9765fddf8dedb8d918d10b --- /dev/null +++ b/full_models/nlg/vocab.txt @@ -0,0 +1,30 @@ +r +d +- +p +v +j +o +f +e +i +q +g +n +c +u +k +w +t +h +b +s +m +z + +_ +a +' +y +x +l diff --git a/full_models/nlk/D_100000.pth b/full_models/nlk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa0bb98fd1f3377a3cec237469a16e92a7655a25 --- /dev/null +++ b/full_models/nlk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a39b03be1c72a8e491cdc81f2e23d30cd2ce5be1e2ab0436df9737cd690ab8 +size 561078634 diff --git a/full_models/nlk/G_100000.pth b/full_models/nlk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3340404f6e9ae7a1f93bb19cd6e6797f3ece227 --- /dev/null +++ b/full_models/nlk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a024a8c3466c9e343e5e127edad60afb736ed09a69670e5b06708b5883ef66f9 +size 436373695 diff --git a/full_models/nlk/config.json b/full_models/nlk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nlk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nlk/vocab.txt b/full_models/nlk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..53fcfb99a7907bbc57f31f9d4be7903abda7cc51 --- /dev/null +++ b/full_models/nlk/vocab.txt @@ -0,0 +1,36 @@ +m +c +0 +z +5 +t +r +s +j +o +i +f +g +e +d +6 +u +w + +n +p +2 +9 +k +a +4 +3 +_ +y +l +b +8 +1 +7 +h +- diff --git a/full_models/nmz/D_100000.pth b/full_models/nmz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1a55b9218e72a4207f9efd118397242ce384bb8e --- /dev/null +++ b/full_models/nmz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cc958ebb68e12dc9c03634dc23e06d288172f74b5fb5bf598597c319244111 +size 561079258 diff --git a/full_models/nmz/G_100000.pth b/full_models/nmz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..15cf374051f990ecde571c8ede8fb1ee283f0f6a --- /dev/null +++ b/full_models/nmz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cf280c9940fe2c08f10b5e7fdd4e7d2cf2678d61d37378504eb5f0cf44f681 +size 436398095 diff --git a/full_models/nmz/config.json b/full_models/nmz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nmz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nmz/vocab.txt b/full_models/nmz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..14842e31670f2954ad222b3b667d95a336d7286e --- /dev/null +++ b/full_models/nmz/vocab.txt @@ -0,0 +1,44 @@ +s +m +ù +g +– +y +c +r +f +e +' +k +a +ɔ +1 +v +j +u +_ +ú +i +ì + +d +í +à +ɛ +- +w +p +` +o +2 +ĥ +l +á +t +ɦ +́ +n +ŋ +̈ +h +b diff --git a/full_models/nnb/D_100000.pth b/full_models/nnb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fbed1c10c292516aa730ca7f37ef8cf3a66d1be4 --- /dev/null +++ b/full_models/nnb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd07b529fc60f5a45aef76e317250918c281ab1448212e0171ecaf8ac668d98e +size 561078995 diff --git a/full_models/nnb/G_100000.pth b/full_models/nnb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c51858cec766785d0db9bc16c10806dda033fc2 --- /dev/null +++ b/full_models/nnb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf739641b65506bfa13a54db5f16e0f53e99e40041ce57ec9c0ecc39aefde739 +size 436375763 diff --git a/full_models/nnb/config.json b/full_models/nnb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nnb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nnb/vocab.txt b/full_models/nnb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a75a7d1368f11b48b4373909f888a01566a3f105 --- /dev/null +++ b/full_models/nnb/vocab.txt @@ -0,0 +1,35 @@ +a +| +n +e +o +b +y +m +k +i +u +ĩ +r +w +s +l +g +t +ũ +ʼ +h +d +z +p +- +f +­ +0 +v +1 +j +c +2 +3 + diff --git a/full_models/nnq/D_100000.pth b/full_models/nnq/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..292542a7a31977098551efcdf096fdf635a11b8f --- /dev/null +++ b/full_models/nnq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083f004c453cbbbe7cad8a3698b4eabf60557589c5f2a67ff501d2c69b29bf26 +size 561078981 diff --git a/full_models/nnq/G_100000.pth b/full_models/nnq/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..afbee2a22385878f566d3e2855a525410e12b1ba --- /dev/null +++ b/full_models/nnq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8059861b09daf5bb0be2fbc86ffc59227d4b07a2ee3d928ecfd84cb817901302 +size 436355228 diff --git a/full_models/nnq/config.json b/full_models/nnq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nnq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nnq/vocab.txt b/full_models/nnq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2d70537bd7a42ef5c20d6dfe49ba3b78b20deb82 --- /dev/null +++ b/full_models/nnq/vocab.txt @@ -0,0 +1,26 @@ +a +| +n +e +i +u +k +o +g +m +b +l +w +t +j +p +d +h +y +c +s +' +f +z +v + diff --git a/full_models/nnw/D_100000.pth b/full_models/nnw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..13e955b9eba20c7ebfdd6781c088cd7831e2f5bf --- /dev/null +++ b/full_models/nnw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81359fbe5738fcc3221e9878e8da6f584bbd15baa673256913ba9ad4398b33b7 +size 561078718 diff --git a/full_models/nnw/G_100000.pth b/full_models/nnw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9768a0ae5eb704dc546c98c4b51be2c3952e88cb --- /dev/null +++ b/full_models/nnw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00f0b72a869410b3e9eb2962c7efacd1448d323a18a9cc211a598ff2db310cb +size 436415010 diff --git a/full_models/nnw/config.json b/full_models/nnw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nnw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nnw/vocab.txt b/full_models/nnw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..faec2dd9ac03810d60a1df7241800d8494af9c04 --- /dev/null +++ b/full_models/nnw/vocab.txt @@ -0,0 +1,54 @@ +| +ɑ +ə +n +ɩ +ʋ +̀ +t +́ +w +y +b +d +k +i +m +l +s +r +u +z +p +o +ɡ +c +ŋ +ɛ +ì +a +j +e +í +f +ń +- +á +ú +v +ù +ý +à +' +g +ɔ +ò +1 +h +ó +è +é +0 +̌ +2 + diff --git a/full_models/noa/D_100000.pth b/full_models/noa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..358b391cb150175913962056ea2ad95156ccdf13 --- /dev/null +++ b/full_models/noa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:768702aae1c7912e63aafc7d804f373e6a1510868b10d5cfc8330ccaf6bdc908 +size 561076173 diff --git a/full_models/noa/G_100000.pth b/full_models/noa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..989d8499ee934f04f895e6a633e4369a405f1d44 --- /dev/null +++ b/full_models/noa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0a56cc9dfe14b4b1888ec4568ff698c1c377ffe893a6e4b1f1cf78dbc92f10 +size 436383395 diff --git a/full_models/noa/config.json b/full_models/noa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/noa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/noa/vocab.txt b/full_models/noa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a186571bb0369e5178cd9db94c5d6bac5c020ee5 --- /dev/null +++ b/full_models/noa/vocab.txt @@ -0,0 +1,48 @@ +a +| +h +i +m +r +u +ʌ +e +j +' +n +g +c +p +k +d +t +w +b +o +ã +s +ë +ö +ĩ +̈ +ẽ +õ +ũ +l +̃ +y +á +ú +í +— +ä +é +f +v +ó +z +ñ +́ +q +x + diff --git a/full_models/nod/D_100000.pth b/full_models/nod/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9fa070a4c6163e839e00afdff6e4d0a816a6647e --- /dev/null +++ b/full_models/nod/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8516bed5bc68d2cc053a1bd4484f092c120ed9be01e3d75d50425e4242ac29 +size 561079227 diff --git a/full_models/nod/G_100000.pth b/full_models/nod/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f04f33e041f513f1a9fd361db31c27748457fceb --- /dev/null +++ b/full_models/nod/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27abcbde38476691dee1ea79958a19caa66d3c2a6b3efd027b9fbb479b3300b +size 436448379 diff --git a/full_models/nod/config.json b/full_models/nod/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nod/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nod/vocab.txt b/full_models/nod/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50de080d527bf39f50992236100c2c4551091196 --- /dev/null +++ b/full_models/nod/vocab.txt @@ -0,0 +1,66 @@ +า +้ +น +อ +เ +่ +ต +ก +ง +ย +ั +ม +| +ห +ี +ว +จ +ร +ะ +บ +ู +๋ +ค +ป +ข +ด +ื +ิ +ล +ส +พ +แ +ไ +ใ +ฮ +์ +็ +ผ +โ +ึ +๊ +ุ +ํ +ถ +ญ +ซ +ท +ธ +ษ +ฟ +ณ +ศ +ภ +ฝ +ช +ฐ +ฆ +ฉ +ฤ +ฏ +ฎ +ฒ +ฑ +' +ฬ + diff --git a/full_models/nog/D_100000.pth b/full_models/nog/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3d6522acc1a021a2b6233ff7bf7b72f0231991a2 --- /dev/null +++ b/full_models/nog/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4719da24c76c8a7fc2ab345f8c2e1b3c21e8bcb671f5aa081d66ab1e1a512ac +size 561079368 diff --git a/full_models/nog/G_100000.pth b/full_models/nog/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e2fbe9a00752809f7a8585927f3ce8584c331b7 --- /dev/null +++ b/full_models/nog/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ea18fab8c5cf0ef6f3c6c32f0d50e4045e0b9d369ad4dd7aeb9c6db7ac6de4 +size 436392409 diff --git a/full_models/nog/config.json b/full_models/nog/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nog/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nog/vocab.txt b/full_models/nog/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9dc6089417b4d29a81ceaac762cd6ec21431926c --- /dev/null +++ b/full_models/nog/vocab.txt @@ -0,0 +1,42 @@ +ф +и + +2 +х +с +ъ +э +л +у +– +0 +в +ш +к +о +г +- +р +п +н +т +1 +й +6 +ы +ь +3 +б +д +ю +е +4 +а +ц +м +' +ч +з +я +ж +_ diff --git a/full_models/not/D_100000.pth b/full_models/not/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d9886bcea499705557a4c601863993219da0135a --- /dev/null +++ b/full_models/not/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea002f2f292fb1adbece8231450cee480e2bd2b22d05fe21ec3c032fa538a71a +size 561078584 diff --git a/full_models/not/G_100000.pth b/full_models/not/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3a28f74fdd30f16a286a184aae716f83b41f65f --- /dev/null +++ b/full_models/not/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4da6e70f381d6e0f7c247d85a78d8d2b27da4717ca22a50a515439d3995b08 +size 436385195 diff --git a/full_models/not/config.json b/full_models/not/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/not/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/not/vocab.txt b/full_models/not/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d10095c083bb574ef019bdc25964a1ca1834fcb6 --- /dev/null +++ b/full_models/not/vocab.txt @@ -0,0 +1,41 @@ +0 + +8 +á +6 +c +ó +b +p +l +1 +q +v +2 +j +r +— +ë +m +t +o +d +' +n +3 +é +9 +s +h +í +7 +z +5 +i +y +a +e +4 +g +u +_ diff --git a/full_models/npl/D_100000.pth b/full_models/npl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..04d57082e5e0d36332e31d8ac8ec0bc6862f1bfa --- /dev/null +++ b/full_models/npl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b002bef726f9097b586d4af89d799410bb7591c05ecce558857627785cb264b +size 561078973 diff --git a/full_models/npl/G_100000.pth b/full_models/npl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e32cee3837e136072ffb5bda2e5f8739dc91478 --- /dev/null +++ b/full_models/npl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0eefd893218c33f3064d4cc0edbe131b0d8046e239cd07d390851a91a5ec01c +size 436378843 diff --git a/full_models/npl/config.json b/full_models/npl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/npl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/npl/vocab.txt b/full_models/npl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..371f051645208203d5d1e2be6b39eff47b5cbe8a --- /dev/null +++ b/full_models/npl/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +k +o +t +n +e +l +h +m +s +w +j +c +p +y +r +u +d +x +ó +í +á +ú +é +b +— +g +f +v +z +q +ñ +' +- + diff --git a/full_models/npy/D_100000.pth b/full_models/npy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c0f8fdfe1b1cf2f70347cf8286c7634f246fd68c --- /dev/null +++ b/full_models/npy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce50801f03e9296b70fbc666e81b745bd1e50e80be5a7e1671e72fc1ac86409 +size 561078972 diff --git a/full_models/npy/G_100000.pth b/full_models/npy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..de29f7cf347d98f8753cb760149771af983e54f9 --- /dev/null +++ b/full_models/npy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c003e8e6b792d7420fa8e11b36b3a80c3482e07afb72bfccd9ae26b7ca1863a +size 436354653 diff --git a/full_models/npy/config.json b/full_models/npy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/npy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/npy/vocab.txt b/full_models/npy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..576a034cd5e45c34dace6ba48055dfee0e1f0205 --- /dev/null +++ b/full_models/npy/vocab.txt @@ -0,0 +1,26 @@ +a +| +i +n +u +o +e +m +l +p +h +t +k +r +d +g +b +s +w +y +- +' +j +f +c + diff --git a/full_models/nst/D_100000.pth b/full_models/nst/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c5f6cf87d9ba2fce5b8ca4f912b314ca0c3d7d74 --- /dev/null +++ b/full_models/nst/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137a446ab51a12fa9a3ed04a357e20c5114dad5f34cbaa27f922c7711d7d5ce4 +size 561076187 diff --git a/full_models/nst/G_100000.pth b/full_models/nst/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49f3d0ebd0e801000b6a9b4228f16abfeb3eee71 --- /dev/null +++ b/full_models/nst/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242bc43ee562da2c9947f868c33efbbe13311abbe2e4ea4a29564e3f5399b67f +size 436335159 diff --git a/full_models/nst/config.json b/full_models/nst/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nst/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nst/vocab.txt b/full_models/nst/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..96d1178ea5bb9296a62b0503e5aa0744a83d81d3 --- /dev/null +++ b/full_models/nst/vocab.txt @@ -0,0 +1,27 @@ +h +ü +p +s +i +d +a +y +j + +z +t +' +ā +v +n +l +k +b +m +o +g +e +c +_ +r +u diff --git a/full_models/nsu/D_100000.pth b/full_models/nsu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c1bba13b56a60ae6c3666dd3244a7314c8243d7 --- /dev/null +++ b/full_models/nsu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51191e309c964e5dd49811af3e0ae7cf803cf721491463c06f5dda5f11f7a8a8 +size 561078623 diff --git a/full_models/nsu/G_100000.pth b/full_models/nsu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6fa76aafd13f33b24a872a10ba48df23b99f7739 --- /dev/null +++ b/full_models/nsu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c186a590179f79179b2009e3e8e5d0b3a12908768a159dbc3e37ccf76266c261 +size 436386083 diff --git a/full_models/nsu/config.json b/full_models/nsu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nsu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nsu/vocab.txt b/full_models/nsu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b743472c2077e29b051f983026c464366df717a6 --- /dev/null +++ b/full_models/nsu/vocab.txt @@ -0,0 +1,41 @@ +q +1 +i +ó +y +l +a +e +2 +— +í +m +p +4 +j +s +z +d +h +b +u +c +r + +v +w +k +n +t +ñ +0 +_ +5 +g +á +x +6 +é +f +o +ú diff --git a/full_models/ntm/D_100000.pth b/full_models/ntm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1aa718752291e265cacb4f1841cd28b76c637656 --- /dev/null +++ b/full_models/ntm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7bc53e370aee5e07b5fca81fadc9944b57aa152d5f4cfcd525fd0a48e8a257 +size 561078750 diff --git a/full_models/ntm/G_100000.pth b/full_models/ntm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dbe6b97a3065c2f27b300d02e396e75f5cde1110 --- /dev/null +++ b/full_models/ntm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c5520d9a0db1d179a54f03cd14699e195bec71ae24602654614d60c629fd65 +size 436390647 diff --git a/full_models/ntm/config.json b/full_models/ntm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ntm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ntm/vocab.txt b/full_models/ntm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..175a09ef1ff69b06101e61bc328e0f932ab06993 --- /dev/null +++ b/full_models/ntm/vocab.txt @@ -0,0 +1,42 @@ +ù +ǹ +e +a +í +ṵ +ɔ +̰ +ɛ +̀ +c +n +- +k +à +o +p +y +f +ḿ +b +́ +è +ú +w +i +ó +ḭ +t +' +u +á +s +é +ń +_ +ì +d + +h +m +ò diff --git a/full_models/ntr/D_100000.pth b/full_models/ntr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa29f6f2ec8a6b743b29e1038d59839c66e988e4 --- /dev/null +++ b/full_models/ntr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4d114d38a6e6b56d16dc7cc58a454b82584e972a0f5fd7373d67a925f05ef6b +size 561078618 diff --git a/full_models/ntr/G_100000.pth b/full_models/ntr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02d10d437888ab74a97f26520a89bb0cca1b8a0b --- /dev/null +++ b/full_models/ntr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c652a812f5162a6959aa9a01f337af0610f7681db12258897311717276401b1e +size 436355123 diff --git a/full_models/ntr/config.json b/full_models/ntr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ntr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ntr/vocab.txt b/full_models/ntr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3f3866bb3eba0e53d7bda88d3774ec517da65129 --- /dev/null +++ b/full_models/ntr/vocab.txt @@ -0,0 +1,28 @@ +| +a +e +n +ɛ +o +ŋ +ↄ +k +y +b +i +m +l +u +d +t +w +s +r +g +p +f +' +h +3 +0 + diff --git a/full_models/nuj/D_100000.pth b/full_models/nuj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..18cb977d6428549821407ae15f65014d37fbdd50 --- /dev/null +++ b/full_models/nuj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65b87b57ebdc0906b2d92de99666107f4046cad17c1a32a95a9ec9b626452651 +size 561078998 diff --git a/full_models/nuj/G_100000.pth b/full_models/nuj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ebbf55c574e3b0aabba66aacc937b5051f2283c5 --- /dev/null +++ b/full_models/nuj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80561914b59c7751ef782886fd17214e5783c6e1d6074a90f13a95aed0f4b85e +size 436364838 diff --git a/full_models/nuj/config.json b/full_models/nuj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nuj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nuj/vocab.txt b/full_models/nuj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c1dce24d9f972e5228395a01c969d287ee7cf312 --- /dev/null +++ b/full_models/nuj/vocab.txt @@ -0,0 +1,30 @@ +m +j +p +a +v +s +l +_ +w +f +y +k +r +d +b +e +n +' +u +- +ŋ +z +i +g +o +h + +c +ʼ +t diff --git a/full_models/nus/D_100000.pth b/full_models/nus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f587cdf90df9fd76ece7156c022cef30dc5eca6f --- /dev/null +++ b/full_models/nus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8916e60cf78a5ebfa97525b5fed836734ce3d62718a255298669997808616268 +size 561078987 diff --git a/full_models/nus/G_100000.pth b/full_models/nus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d3ec5caace0c17f96d24e90f3a9c8743faffeb2 --- /dev/null +++ b/full_models/nus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8ed31163c0ca2d75b6e946d26958f2326e5ff63d90467b9746456fd54f2aa96 +size 436373627 diff --git a/full_models/nus/config.json b/full_models/nus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nus/vocab.txt b/full_models/nus/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8f7feaf73a34c91ae14f597afd7d88e15e357928 --- /dev/null +++ b/full_models/nus/vocab.txt @@ -0,0 +1,34 @@ +| +ɛ +k +i +a +n +t +̱ +ä +u +c +ɔ +l +r +m +h +d +e +y +j +ö +ŋ +b +ë +o +ɣ +w +p +g +- +̈ +' +1 + diff --git a/full_models/nuz/D_100000.pth b/full_models/nuz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..70f513a2a28e9f54fc228da9d0980589408e9bd8 --- /dev/null +++ b/full_models/nuz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78ffe2bc61bb7eda1f0808042e2885d1cf7e343387744d41d88358568067b51 +size 561076157 diff --git a/full_models/nuz/G_100000.pth b/full_models/nuz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..15efb14323f0ee640bdeab3c5e98004e40a10857 --- /dev/null +++ b/full_models/nuz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46435fdb9c56828def6c3add01ab7a7bbaf0e1ba8f6fec2cca1d3b37f7c3a773 +size 436350771 diff --git a/full_models/nuz/config.json b/full_models/nuz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nuz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nuz/vocab.txt b/full_models/nuz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7a918b7972e9d75245aa5bc3309b8378280bbd49 --- /dev/null +++ b/full_models/nuz/vocab.txt @@ -0,0 +1,34 @@ +í +u +e +r +z +_ +é +t +g + +f +ú +s +l +h +p +i +o +q +c +a +ñ +á +x +k +m +ó +— +j +b +y +n +v +d diff --git a/full_models/nwb/D_100000.pth b/full_models/nwb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0575ae45359eb9978c517b3776cc1b1ce511a585 --- /dev/null +++ b/full_models/nwb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f662b4a330b6556b17e1bc6e1b9b60cd3d696691dbf49a9fdc2ce690f1e1455f +size 561076192 diff --git a/full_models/nwb/G_100000.pth b/full_models/nwb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..65edb18b0c9542bed5c1112e7a0bfd2aa2a937db --- /dev/null +++ b/full_models/nwb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d55814814ff855a910f37cbf4dd21cbace0729a55aee8333c044b638c7b6753 +size 436348839 diff --git a/full_models/nwb/config.json b/full_models/nwb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nwb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nwb/vocab.txt b/full_models/nwb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d0285cba42a4a1bfe1cb93841a9ee42e30216300 --- /dev/null +++ b/full_models/nwb/vocab.txt @@ -0,0 +1,33 @@ +| +' +a +- +n +e +l +ɔ +ʋ +i +ɩ +y +k +ɛ +b +m +o +u +g +h +d +z +t +p +w +s +r +f +j +c +v +q + diff --git a/full_models/nxq/D_100000.pth b/full_models/nxq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92520a4a90b3ce8b85201e9f04f6c11edd3f4785 --- /dev/null +++ b/full_models/nxq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c14bd72a9fda5dbfb4fda1ed1656b659387bb19f72ed24199bdcdb4ba5b719 +size 561078839 diff --git a/full_models/nxq/G_100000.pth b/full_models/nxq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8138e91c181517f605c16b95982a1936c54d33fb --- /dev/null +++ b/full_models/nxq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7606c5ea0faf954494848d38e90c0731fed5e2f5b5606bfa9084bff1d5c1bfdf +size 436359016 diff --git a/full_models/nxq/config.json b/full_models/nxq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nxq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nxq/vocab.txt b/full_models/nxq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..402713b2492ce3309f368aba77e602615226b269 --- /dev/null +++ b/full_models/nxq/vocab.txt @@ -0,0 +1,29 @@ +n +b +_ +l +m +u + +' +e +x +r +w +o +p +j +d +a +k +h +z +y +i +g +f +t +v +s +c +q diff --git a/full_models/nya/D_100000.pth b/full_models/nya/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdda7360da5eaa78955d0b8d17c3a8cd52e9f3c1 --- /dev/null +++ b/full_models/nya/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d805789c8aea5bfc84772a7892ed9838ead816565634214c483140e5e45f9e66 +size 561110384 diff --git a/full_models/nya/G_100000.pth b/full_models/nya/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa3151cf744cbc85a5b63575d4f8a3f3e1888fe2 --- /dev/null +++ b/full_models/nya/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86c3dfd33c909723fae3bdbcfb091fd2c6b1c39adef691103f4f18d858afa0f +size 436622468 diff --git a/full_models/nya/config.json b/full_models/nya/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nya/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nya/vocab.txt b/full_models/nya/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..1e72ecf80c1e9c791c5812469c18031a26e459d5 --- /dev/null +++ b/full_models/nya/vocab.txt @@ -0,0 +1,39 @@ +m +w +i +_ +7 +u +d +z +b +q +p +o +4 +g +v +e +' +c +3 +9 +y +t +5 +ʼ +8 +k +a +2 +s +h +f +r +1 +n +0 +l + +6 +j diff --git a/full_models/nyf/D_100000.pth b/full_models/nyf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d0be71582d67e79ccd091af10eefac0a0cf74f0 --- /dev/null +++ b/full_models/nyf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500c151390d69a433af8dcb9d8ecadd6d59b5550b6292a8d44a8305de46d0688 +size 561078869 diff --git a/full_models/nyf/G_100000.pth b/full_models/nyf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49fd5d433d4581d6c7592874de9a49444d5a1c6f --- /dev/null +++ b/full_models/nyf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ffc024f04bbb438ef4a42fc1a7603e25107bbf53735e90adb3c1c069c4f6be +size 436358914 diff --git a/full_models/nyf/config.json b/full_models/nyf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nyf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nyf/vocab.txt b/full_models/nyf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c22eddf49f53d9e25c2732e92c3394edf4919e25 --- /dev/null +++ b/full_models/nyf/vocab.txt @@ -0,0 +1,29 @@ +a +| +i +u +n +k +m +e +h +o +w +r +l +z +d +g +y +s +t +b +' +v +f +j +c +p +̱ +- + diff --git a/full_models/nyn/D_100000.pth b/full_models/nyn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..52e51858a80303d57fd097a722f4155977c8611f --- /dev/null +++ b/full_models/nyn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc498289111a27ee8c1352e2666ff4889da0cc158dd56862e78b299ba5f4bb53 +size 561078614 diff --git a/full_models/nyn/G_100000.pth b/full_models/nyn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d6eec4ba4725f17bd4c29cb043a5b7e939d8b10 --- /dev/null +++ b/full_models/nyn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ce29a6f4d51fda76a19c3d1446f9edba81e239d5f76bc8e98c74515b3fb00c +size 436355236 diff --git a/full_models/nyn/config.json b/full_models/nyn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nyn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nyn/vocab.txt b/full_models/nyn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..60cc97283bc91c2ec937d849a741d06c5fbe2238 --- /dev/null +++ b/full_models/nyn/vocab.txt @@ -0,0 +1,28 @@ +a +| +i +e +u +r +n +o +k +b +m +w +y +g +h +t +s +' +z +d +j +l +p +f +c +- +v + diff --git a/full_models/nyo/D_100000.pth b/full_models/nyo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..63ff0d2fa4f5ce120a4a36063f59b5c0bac4fac3 --- /dev/null +++ b/full_models/nyo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf4c559e5410b750ec9110b337635a7183f3dd51b06ff69a341363c3238bb4e +size 561078966 diff --git a/full_models/nyo/G_100000.pth b/full_models/nyo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..15c72f109dc2c627d3f0d58af2d6ca5918ab3628 --- /dev/null +++ b/full_models/nyo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe47bbcf1a22bdc4f42285563407ef34ad42a650abf3ad6775fa9a316f3377d +size 436358686 diff --git a/full_models/nyo/config.json b/full_models/nyo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nyo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nyo/vocab.txt b/full_models/nyo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..753699284fc68690e6688867f69f2a3e141bd996 --- /dev/null +++ b/full_models/nyo/vocab.txt @@ -0,0 +1,28 @@ +a +| +i +u +e +n +o +b +k +r +m +w +g +y +t +h +s +z +l +' +d +j +f +p +c +- +v + diff --git a/full_models/nyy/D_100000.pth b/full_models/nyy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2982a2c158b017606ecc201fe7970e35175b7893 --- /dev/null +++ b/full_models/nyy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6913121a896762319a44dfd9e04e4c23385c48a856364dd0a3291c4c647aa0f8 +size 561078875 diff --git a/full_models/nyy/G_100000.pth b/full_models/nyy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..512b25a48c2fa2ae5326b4603212496d83009e85 --- /dev/null +++ b/full_models/nyy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8097596eeb16cce7fdf7e928d67fdde224f2b2ad2989b6189b0913555c467d4 +size 436398677 diff --git a/full_models/nyy/config.json b/full_models/nyy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nyy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nyy/vocab.txt b/full_models/nyy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7ed4b98997354d2c0c70b6147077e8b5bdaaefa4 --- /dev/null +++ b/full_models/nyy/vocab.txt @@ -0,0 +1,45 @@ +| +a +u +n +l +k +ị +b +i +m +o +e +g +s +w +t +y +ụ +p +j +ā +̄ +f +d +ō +ū +ī +ē +h +' +ạ +ḳ +ẹ +ọ +r +̣ +ṣ +ṃ +ḷ +v +ḅ +ỵ +ȳ +ẉ + diff --git a/full_models/nzi/D_100000.pth b/full_models/nzi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8b7eeb3f1f5d1c620e057115e89b5fd418a18e60 --- /dev/null +++ b/full_models/nzi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb22d27d3eb4eaa9acd306bdf2357c1120cf7f01059581352bd495004b7134b +size 561079372 diff --git a/full_models/nzi/G_100000.pth b/full_models/nzi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7cf98d3c455050ea5e119916d4882f29f49bdc70 --- /dev/null +++ b/full_models/nzi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db5428e8375fc2186832450b9b57d2837dcd5fd2967129b305323d0485ebe3a +size 436371691 diff --git a/full_models/nzi/config.json b/full_models/nzi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/nzi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/nzi/vocab.txt b/full_models/nzi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6f39dbf2a8dc50b2e2b682af848a87995ad2f82e --- /dev/null +++ b/full_models/nzi/vocab.txt @@ -0,0 +1,33 @@ +m +1 +d +_ +c +i +n +- +u +2 +ɛ +f +l +k +h +a +5 +' +g + +y +w +o +z +9 +v +ɔ +b +s +r +p +e +t diff --git a/full_models/obo/D_100000.pth b/full_models/obo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cced2ebf9e1e3731e11362f9bbcd4834f9da2b74 --- /dev/null +++ b/full_models/obo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec70e55b16eb0e1c9deac1925f9dfe399038a6e7f85d9551c7ead4d4c1b400d +size 561078120 diff --git a/full_models/obo/G_100000.pth b/full_models/obo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7d2dc4e9fe198c0744f8690160d0f3838dcf1f73 --- /dev/null +++ b/full_models/obo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad79d182469503aba1152db6b059062a8dc1f3fe5baba887b845f35b6a37c9f +size 436353121 diff --git a/full_models/obo/config.json b/full_models/obo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/obo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/obo/vocab.txt b/full_models/obo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3841c095585a227e7d06fb1c186b685f19026524 --- /dev/null +++ b/full_models/obo/vocab.txt @@ -0,0 +1,30 @@ +z +v +p +u +' +a +s +m +_ +d +r +h +k +- +b +i +f +g +j +q +w +c +x + +n +y +o +e +t +l diff --git a/full_models/ojb-script_latin/D_100000.pth b/full_models/ojb-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83aaa210fa2da5dcdee38995c7c921bda9edbb19 --- /dev/null +++ b/full_models/ojb-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8faffaa4a5f825245fa909891b230decee0e1396f534994f9b973f59482a77b +size 561078638 diff --git a/full_models/ojb-script_latin/G_100000.pth b/full_models/ojb-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..30d7b171e0d25b95b82614df0b82ee1e26944f24 --- /dev/null +++ b/full_models/ojb-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ee12690cff54f0a3399be1e535b2dc3d23e48ca0df134d890c4d12249edde7 +size 436351029 diff --git a/full_models/ojb-script_latin/config.json b/full_models/ojb-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ojb-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ojb-script_latin/vocab.txt b/full_models/ojb-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d2469d89fe62eba479225272cadb142f50cacf5f --- /dev/null +++ b/full_models/ojb-script_latin/vocab.txt @@ -0,0 +1,26 @@ +i +a +k +| +n +h +o +t +s +e +w +m +c +' +p +y +- +r +l +– +2 +0 +3 +z +5 + diff --git a/full_models/ojb-script_syllabics/D_100000.pth b/full_models/ojb-script_syllabics/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ad50e4ac057561e1a604531c77225c8123729010 --- /dev/null +++ b/full_models/ojb-script_syllabics/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35554ad9113febb19773adaf86fbf66ffbedbddf5bfe70bf27bd694084a434f +size 561078706 diff --git a/full_models/ojb-script_syllabics/G_100000.pth b/full_models/ojb-script_syllabics/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0edd15d4a724551bd29a8465ee8d7357232208ad --- /dev/null +++ b/full_models/ojb-script_syllabics/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:749cf835ce1b9965ca2c4e5c7a030ab1a0164a35b1f7481161bb8c87f725cb44 +size 436653651 diff --git a/full_models/ojb-script_syllabics/config.json b/full_models/ojb-script_syllabics/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ojb-script_syllabics/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ojb-script_syllabics/vocab.txt b/full_models/ojb-script_syllabics/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..88e4bf90c3cd6f369a884b210cc0729c4eb341a0 --- /dev/null +++ b/full_models/ojb-script_syllabics/vocab.txt @@ -0,0 +1,156 @@ +| +ᓂ +ᐃ +ᓐ +ᑕ +ᑭ +ᒋ +ᑳ +ᐅ +ᑮ +ᑲ +ᒡ +ᐊ +ᒃ +ᔥ +ᔑ +ᐙ +ᐎ +ᓇ +ᐁ +ᑫ +ᑯ +ᒫ +ᓯ +ᒥ +ᑎ +ᐱ +ᒪ +ᐐ +ᐌ +ᓈ +ᕽ +ᔦ +ᐗ +ᐸ +ᒦ +ᑑ +ᐋ +ᑖ +ᑌ +ᓴ +ᔮ +ᓃ +ᔭ +ᑰ +ᐯ +ᓀ +ᐲ +ᓄ +ᔐ +ᑾ +ᐞ +ᒧ +ᓰ +ᒀ +ᔕ +ᓅ +ᒻ +ᑐ +ᑴ +ᔅ +ᒌ +ᓱ +ᐹ +ᓭ +ᒣ +ᐺ +ᓵ +ᒨ +ᒑ +ᔖ +ᓬ +a +ᕒ +e +ᐄ +x +ᔓ +s +ᐴ +ᑣ +ᔒ +ᐆ +ᒎ +ᐳ +ᑦ +i +r +ᓍ +ᓲ +ᓉ +ᔔ +l +ᑏ +ᒐ +ᑆ +m +h +o +u +p +t +ᐤ +n +ᑸ +j +d +ᔣ +ᒉ +c +ᔂ +ᔫ +ᔨ +ᒞ +ᑉ +ᔗ +ᑗ +ᔩ +b +2 +y +0 +g +3 +ᓶ +1 +v +ᒬ +ᑶ +4 +7 +z +ᔪ +ᐾ +ᓋ +– +ᒸ +ᒶ +ᔛ +k +ᒍ +8 +f +5 +w +ᔀ +9 +6 +ᔾ +ᔡ +ᐼ +ᐧ +ᒁ +q +ᒒ + diff --git a/full_models/oku/D_100000.pth b/full_models/oku/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ef8659e086ab61ce32530ed5e030be7e879e0381 --- /dev/null +++ b/full_models/oku/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c83d5f30db98128859ad453a508c355c0f96bdef020cc7b116a092e260af329c +size 561078998 diff --git a/full_models/oku/G_100000.pth b/full_models/oku/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c91820c8d159b733d642d6369ce157e4f8f29471 --- /dev/null +++ b/full_models/oku/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f581ec4a33941af8118101a096096525340d4c9f957fa6c3388f1c26ea9331 +size 436406639 diff --git a/full_models/oku/config.json b/full_models/oku/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/oku/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/oku/vocab.txt b/full_models/oku/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b315a2747ce9c9d77e02ac94e09f3a1c0fae5b5b --- /dev/null +++ b/full_models/oku/vocab.txt @@ -0,0 +1,49 @@ +| +e +n +ɛ +y +i +s +k +g +l +a +h +ə +b +u +m +o +w +t +f +è +j +d +ŋ +c +́ +̀ +à +á +v +- +ò +̂ +é +ó +î +r +ì +ô +z +í +ú +û +â +ê +ù +1 +3 + diff --git a/full_models/old/D_100000.pth b/full_models/old/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..df12a77b0863b91ba7fd922878414b2fee21d1a6 --- /dev/null +++ b/full_models/old/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3b3df88a865bf132af915695fb736582fd02b55d75feaea6ff6786ed1bf1b9 +size 561078861 diff --git a/full_models/old/G_100000.pth b/full_models/old/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..911fd2582bf39a1f945dcf6839d4acee92649190 --- /dev/null +++ b/full_models/old/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1487b26174998a715f9a2b1799a6627fec985cdd6bf52a02ea883504b0022b +size 436368005 diff --git a/full_models/old/config.json b/full_models/old/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/old/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/old/vocab.txt b/full_models/old/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d29ecae6fe30a323eb607c571816023ca39ab939 --- /dev/null +++ b/full_models/old/vocab.txt @@ -0,0 +1,32 @@ +| +a +i +n +o +u +k +e +y +w +m +h +l +d +s +f +t +r +c +g +b +ṟ +p +- +j +' +z +v +̱ +ḏ +ḵ + diff --git a/full_models/omw/D_100000.pth b/full_models/omw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0396e5e2775661231f5d926978560282815873a9 --- /dev/null +++ b/full_models/omw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e72d54ace2131a0fd45c6387fcba9d7c67455089e71e27de456a0df4519f6f7 +size 561076183 diff --git a/full_models/omw/G_100000.pth b/full_models/omw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f562bb80330d6cfb881ed048d35775952fbcb3f5 --- /dev/null +++ b/full_models/omw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c7db07444e6b43dc28f422ab118e754c5e9305898b6251310d21b380be0d9e7 +size 436344493 diff --git a/full_models/omw/config.json b/full_models/omw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/omw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/omw/vocab.txt b/full_models/omw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..48d94f64034ef1fb3e059593eb4caef5dacebcf0 --- /dev/null +++ b/full_models/omw/vocab.txt @@ -0,0 +1,31 @@ +q +k +4 +6 +7 +9 +- +m +0 +s +u +e +t +a +8 +i + +w +h +p +v +3 +5 +1 +y +o +_ +2 +r +n +f diff --git a/full_models/onb/D_100000.pth b/full_models/onb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..500cfe879aca4abeafe8c298487303cbefce35b6 --- /dev/null +++ b/full_models/onb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb86469f9d3108249ecbde9640fc93af7b348c4d2e638b8176426504ee4f05c2 +size 561078322 diff --git a/full_models/onb/G_100000.pth b/full_models/onb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9bad43362519b23d21cba62e8214a72bbc52e103 --- /dev/null +++ b/full_models/onb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4be476b80026a96c6bd7c466aca4f79e576ab0cfc8e22337ec0f30286e6de5 +size 436346970 diff --git a/full_models/onb/config.json b/full_models/onb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/onb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/onb/vocab.txt b/full_models/onb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..57c995aa9af735ad52bb20ae9733df31aaf5fd68 --- /dev/null +++ b/full_models/onb/vocab.txt @@ -0,0 +1,27 @@ + +s +_ +z +y +a +n +v +d +o +m +x +i +h +b +p +f +e +- +u +t +q +— +' +l +k +g diff --git a/full_models/ood/D_100000.pth b/full_models/ood/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5303bb5952ed31ba525efd2edb7146b3f5708cc --- /dev/null +++ b/full_models/ood/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b100e9ca4d79f676887cc05dd02a320107550e4945f29e85c96e1b172127ba59 +size 561078640 diff --git a/full_models/ood/G_100000.pth b/full_models/ood/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6df09afecaa5508ce6d38760cc87cadc7fdec4a0 --- /dev/null +++ b/full_models/ood/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c38e91611f7449356e655ab1a4f6c7c3940b77e3bdb5ad2bba9e322020b280 +size 436355874 diff --git a/full_models/ood/config.json b/full_models/ood/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ood/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ood/vocab.txt b/full_models/ood/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24fc3597fc13479af56e23159cfa10762a67e48e --- /dev/null +++ b/full_models/ood/vocab.txt @@ -0,0 +1,30 @@ +y +h +i +o +l +g +a +' +p +e +b +s +r +x +m +z +f +t +d +w +k +u +j +c +n +v +_ +- + +q diff --git a/full_models/orm/D_100000.pth b/full_models/orm/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d0c2c63ab263aa58608621151d2435d67699a776 --- /dev/null +++ b/full_models/orm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf83606c8ec2e300d3746b283ea950c8613bbf963cd48ee44e5149bf926f54c8 +size 561078722 diff --git a/full_models/orm/G_100000.pth b/full_models/orm/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..29d1babbfd0b5c8313156b32ea75bd64f09dc82c --- /dev/null +++ b/full_models/orm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef10a08de2bf446e245a7affcb75792e783d08f855e2ef762ab2fea2516b28a +size 436358347 diff --git a/full_models/orm/config.json b/full_models/orm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/orm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/orm/vocab.txt b/full_models/orm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71d4b7e35a6b8ca26b95e3a43feb8c4723e858c9 --- /dev/null +++ b/full_models/orm/vocab.txt @@ -0,0 +1,29 @@ +r +' +- +f +b +n +j +y +t +d +z +m +e +h +u +q +p +a + +_ +o +x +s +w +g +i +c +l +k diff --git a/full_models/ory/D_100000.pth b/full_models/ory/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2277bd05868b38404b82dbc11a40e733f0a2492 --- /dev/null +++ b/full_models/ory/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890450d13cce741c85d7ee25b324cfdd44048849774d330efa3acc34c1819ba9 +size 561110145 diff --git a/full_models/ory/G_100000.pth b/full_models/ory/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..31bdd43cbfbcddb3a62b42ee4031da5225491436 --- /dev/null +++ b/full_models/ory/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:874db533e7379be240d27e837531257770f6b15f31a9c9ca97245636f3a517e3 +size 436705382 diff --git a/full_models/ory/config.json b/full_models/ory/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ory/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ory/vocab.txt b/full_models/ory/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..701231bec5476270f6374395dcae3c40e50bcdd8 --- /dev/null +++ b/full_models/ory/vocab.txt @@ -0,0 +1,76 @@ +ଛ +ୂ +– +ବ +ଞ +ଯ +ଇ +ପ +ନ +ର +ଆ +ଅ +0 +ଠ +4 +ଦ +ଙ +ଋ +େ +ଈ +ୈ +ଘ +ଏ +ଖ +ମ +ଳ +ଃ +1 +ଓ +ଊ +7 +ି +2 +ୃ +ଶ +ଣ +ଥ +ଟ +ଡ +ା +ଁ +ଭ +କ +ୀ +ୱ +' +ଂ +ଫ +ଗ +ଚ +଼ +ତ +5 +_ +ଐ +ଔ +- +ଧ + +ଢ +ଜ +ଲ +ଉ +9 +6 +­ +ୋ +୍ +ସ +ୟ +ଝ +ହ +3 +ୌ +ୁ +ଷ diff --git a/full_models/oss/D_100000.pth b/full_models/oss/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20da5a3d1d1c809b99bb6fe6c5ed96d69cf9427d --- /dev/null +++ b/full_models/oss/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b48b02331092b7447fe96055bbd619397f06dcc3fbb008bf72165ef4964b374 +size 561078463 diff --git a/full_models/oss/G_100000.pth b/full_models/oss/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8738d6e14f54bbd719b20c530ed654f8cd729978 --- /dev/null +++ b/full_models/oss/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f13f4d2100eda886ece049bd0a1655571fdab509500bf6a9b32730bfb38464f1 +size 436368033 diff --git a/full_models/oss/config.json b/full_models/oss/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/oss/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/oss/vocab.txt b/full_models/oss/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f829245d214e60872699711d3d42bd2c1dd3b9b6 --- /dev/null +++ b/full_models/oss/vocab.txt @@ -0,0 +1,34 @@ +| +ӕ +ы +а +д +у +н +т +р +м +с +й +х +и +г +з +о +ц +к +л +ф +ъ +б +е +в +п +ч +ж +– +' +- +э +ю + diff --git a/full_models/ote/D_100000.pth b/full_models/ote/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bf54d94849a6c353f538c351f72dac9a7d4cf57 --- /dev/null +++ b/full_models/ote/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100d89e373ca1429082ea3810a60368582d1e64bf7de9a02bddd6f7bc198b413 +size 561078618 diff --git a/full_models/ote/G_100000.pth b/full_models/ote/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..060c4195296e4b1544f201058ce0c7a79f447867 --- /dev/null +++ b/full_models/ote/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cebcb9f529edec09814c8d58948ffd759db7d86e94b0080c032b208a3e7a796 +size 436382766 diff --git a/full_models/ote/config.json b/full_models/ote/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ote/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ote/vocab.txt b/full_models/ote/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..016d6d41eb2a0e908aa434092114b766bb22642f --- /dev/null +++ b/full_models/ote/vocab.txt @@ -0,0 +1,40 @@ +| +a +n +i +' +u +e +h +t +d +r +g +o +̱ +m +ʉ +b +y +j +s +p +á +x +c +ñ +ɛ +ú +ø +í +f +z +q +l +́ +ó +v +é +ü +k + diff --git a/full_models/otq/D_100000.pth b/full_models/otq/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ffb7a7ee07b196ba3b2059b22564d33be74d04cf --- /dev/null +++ b/full_models/otq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2355bb9866f6837754c6dd97cf47b07548d3a5641e56a33bebe4b926bbd7687a +size 561078973 diff --git a/full_models/otq/G_100000.pth b/full_models/otq/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..5921856b9d43f7f27105f3f11cf4067aa41af64a --- /dev/null +++ b/full_models/otq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c3c5566eee4dac1a1ce45c92458301c04388ba704269fd0fe38623c1eac82c6 +size 436379540 diff --git a/full_models/otq/config.json b/full_models/otq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/otq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/otq/vocab.txt b/full_models/otq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f295a91d6422eef3334e066e31ad5a2543e6d216 --- /dev/null +++ b/full_models/otq/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +n +h +̱ +u +' +e +t +m +o +g +r +ö +d +b +y +s +x +j +ñ +p +k +á +w +f +z +l +ú +ë +— +ó +é +í +c + diff --git a/full_models/ozm/D_100000.pth b/full_models/ozm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f69fc547579cddf7bb050d535e3109e6dc785727 --- /dev/null +++ b/full_models/ozm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce6b61a791800a29bf2438b0af4320a839c379a62c25881aa9818c4c208160d +size 561078348 diff --git a/full_models/ozm/G_100000.pth b/full_models/ozm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d72a3f5800d2d94457363e1d05aee6d9fbc7559c --- /dev/null +++ b/full_models/ozm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842c70b08b3c5865520e72822e8d842c270c0b3c87d6ca6bc8dccec990485524 +size 436431157 diff --git a/full_models/ozm/config.json b/full_models/ozm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ozm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ozm/vocab.txt b/full_models/ozm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d14ee9a24e475d508c512b5f2386ab03f217d26a --- /dev/null +++ b/full_models/ozm/vocab.txt @@ -0,0 +1,61 @@ +| +b +́ +m +n +e +ɨ +y +é +l +á +ó +a +ɛ +ʉ +s +ʼ +í +̂ +t +w +ɔ +o +ɑ +r +̌ +k +i +j +d +g +p +z +h +â +u +ú +ě +c +î +ŋ +ǎ +ê +û +ô +ø +ǿ +ǐ +ǒ +- +œ +' +f +v +ï +ǔ +q +x +ë +̍ + diff --git a/full_models/pab/D_100000.pth b/full_models/pab/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..573d3f7b185390f3154c40d52a5a4e409a09a6cd --- /dev/null +++ b/full_models/pab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa25bd3068a611986da49219700f861f666990b56a7a03400617cb2bb852f52 +size 561078981 diff --git a/full_models/pab/G_100000.pth b/full_models/pab/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..477f7a4a070b653e9ddab3f452331ab593eec9e0 --- /dev/null +++ b/full_models/pab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09602680d28eb06a0e83403c58c4b81381bd5425f4b670ca414ebd03d362a82c +size 436410037 diff --git a/full_models/pab/config.json b/full_models/pab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pab/vocab.txt b/full_models/pab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..394ceb79e0b34783ffbd5e9ebc9ee166689110fa --- /dev/null +++ b/full_models/pab/vocab.txt @@ -0,0 +1,50 @@ +a +| +e +i +o +h +t +k +n +y +r +x +s +m +l +w +j +u +— +b +d +c +f +p +é +á +ã +- +g +0 +ó +v +q +í +1 +z +2 +ô +4 +7 +5 +ê +ú +6 +3 +8 +9 +â +' + diff --git a/full_models/pad/D_100000.pth b/full_models/pad/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b3570466eae589a10f927ef88c5eeb966aeec47 --- /dev/null +++ b/full_models/pad/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c4dfe86aabb88a72588ad41449dcdfbf611c0a2b0bf0fa07636215aa0cbf53 +size 561076196 diff --git a/full_models/pad/G_100000.pth b/full_models/pad/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e8a5c11c53591f4d74321528b051a6031c38c3a --- /dev/null +++ b/full_models/pad/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c7da66c200c152ff56da11d07419d03d4b8f7b237d2c8b93cb6a4c4a98ef83 +size 436390469 diff --git a/full_models/pad/config.json b/full_models/pad/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pad/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pad/vocab.txt b/full_models/pad/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..55faf67d239a238c09b845c752bbf32b99ec7be8 --- /dev/null +++ b/full_models/pad/vocab.txt @@ -0,0 +1,51 @@ +a +i +| +n +o +h +k +r +v +d +' +j +b +s +m +e +u +t +- +g +p +f +c +— +l +é +ã +x +á +ó +q +z +í +ô +1 +0 +7 +2 +4 +â +ê +ú +5 +6 +ç +3 +8 +9 +î +õ + diff --git a/full_models/pag/D_100000.pth b/full_models/pag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5104a1b2a70a9b2848a030b956ccea7a4ee137f4 --- /dev/null +++ b/full_models/pag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a36e82da769fdfb9a4244d971212b6e3a7f6ca98a4ff386e978f80bb67fdd93 +size 561078754 diff --git a/full_models/pag/G_100000.pth b/full_models/pag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..644006d223a88ac4e26503740e0f4661e48898f4 --- /dev/null +++ b/full_models/pag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0926c8a21af32a2a3072b7a8cffaf102ad05a12c017c8f8dc5b5e6d35f0ac06 +size 436368211 diff --git a/full_models/pag/config.json b/full_models/pag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pag/vocab.txt b/full_models/pag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c5f858ae124447e11c42206ad06a53e4e6f456dd --- /dev/null +++ b/full_models/pag/vocab.txt @@ -0,0 +1,32 @@ +a +| +n +i +o +t +s +y +e +k +g +l +m +d +p +r +b +u +w +j +c +' +h +- +f +z +— +v +q +x +– + diff --git a/full_models/pam/D_100000.pth b/full_models/pam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b856b28b459c5f3e918f3937346ab3f3e4eb213d --- /dev/null +++ b/full_models/pam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48da77d3eb582cdee26f9fd8c455aa56d9a67cfb66568062c7ece136755b9a3f +size 561078619 diff --git a/full_models/pam/G_100000.pth b/full_models/pam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a090e42bbd6791150b94d93357c821827c65cf5b --- /dev/null +++ b/full_models/pam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32af4af643a0f9bccca064fab2f2943068bad00dc08a5e6576e740d0b0975047 +size 436366883 diff --git a/full_models/pam/config.json b/full_models/pam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pam/vocab.txt b/full_models/pam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..24bc87974a20d7868f9f2adc75a73036068fa5cc --- /dev/null +++ b/full_models/pam/vocab.txt @@ -0,0 +1,33 @@ +a +| +n +i +g +u +k +t +l +m +e +s +p +b +y +d +r +o +w +j +h +c +- +f +z +v +' +q +x +— +6 +9 + diff --git a/full_models/pan/D_100000.pth b/full_models/pan/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fd94c408fdac3d0880604c0f0a308eec2cbcd268 --- /dev/null +++ b/full_models/pan/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a85d5ab4a43a95424cf898f9fe8e86b8a396d22ecc11a334042a588ec1ab54f +size 561110353 diff --git a/full_models/pan/G_100000.pth b/full_models/pan/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9416ac1025c52dcf235e17c39f5f5bffad76fd65 --- /dev/null +++ b/full_models/pan/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482da238fb549d5ca7e548a965dad1f6c14393dce69fffddb59e170c2bb9c904 +size 436667569 diff --git a/full_models/pan/config.json b/full_models/pan/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pan/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pan/vocab.txt b/full_models/pan/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..a52e4ea4fcd0bec0bed6fd48dfff8d3b94c51be0 --- /dev/null +++ b/full_models/pan/vocab.txt @@ -0,0 +1,59 @@ +ਏ +ਟ +ੰ +ੈ +ਠ +- +l +_ +ੜ +਼ +ਇ +ਪ +ਣ +ਥ +ਨ +ਸ +ਯ +ਫ +ਝ +ਊ +ਧ +ੁ +ਿ +ਜ +ਔ +ਦ +ੋ +ੌ +6 +ੂ +ਛ + +ੀ +ਗ +ਬ +੍ +ਐ +ਈ +ਘ +ਭ +ਂ +ਓ +ੇ +ਉ +ਅ +ਖ +ਡ +ਲ +ਆ +ਚ +ਵ +ਤ +ਹ +ਕ +ਢ +ਰ +ਾ +ਮ +ੱ diff --git a/full_models/pao/D_100000.pth b/full_models/pao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f11f0ba2565e1f7fb139f8ef0a2da245d467bc2e --- /dev/null +++ b/full_models/pao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21283d46b5c7a70da8a3a35ec280accc96b87ccdfaa9e7be73afcb3522521b0 +size 561077835 diff --git a/full_models/pao/G_100000.pth b/full_models/pao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4fedeeb33725eac0fd63a9a3a07b39fa09859e1e --- /dev/null +++ b/full_models/pao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6224b5f7e6f92d0066e69420385725215b88c63a4e6296842975f9c9ccfb33 +size 436367043 diff --git a/full_models/pao/config.json b/full_models/pao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pao/vocab.txt b/full_models/pao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b43d98fb6ce57c87178d5f8630d91676e5908b49 --- /dev/null +++ b/full_models/pao/vocab.txt @@ -0,0 +1,37 @@ +d +f +i +w +n +v +b +3 +m +_ +h +p +7 +l + +1 +ꞌ +q +6 +- +z +2 +x +u +y +j +8 +r +e +g +c +k +a +s +' +t +o diff --git a/full_models/pap/D_100000.pth b/full_models/pap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f403a860f56d4e6b7f661d0383992690e9a71660 --- /dev/null +++ b/full_models/pap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9f5d1be47e9edc850391da2f2f84220b016e62974b2620574097055d2214b7c +size 561078890 diff --git a/full_models/pap/G_100000.pth b/full_models/pap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0923ab52bad97947bac6cb365013cf13ea8de07e --- /dev/null +++ b/full_models/pap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62dec3c104848db1f1551e157533fd0626625f73682e1623d2421a10ece25834 +size 436411186 diff --git a/full_models/pap/config.json b/full_models/pap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pap/vocab.txt b/full_models/pap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dba21eb3d04f7441d51aa11d376eac0499bf9464 --- /dev/null +++ b/full_models/pap/vocab.txt @@ -0,0 +1,51 @@ +0 +' +f +7 +q +x +g +r +5 +_ +ó +y +4 +h +- +u +e +ù +b +l +n +o +— +z +2 +6 +m +ñ +j +ú +p +1 +t +a +ò +9 +8 +é +w +í +i +d +è +3 +c +s +ü +á + +v +k diff --git a/full_models/pau/D_100000.pth b/full_models/pau/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0cfb2441634031d950c103ea47a074860273c8f4 --- /dev/null +++ b/full_models/pau/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8105d1d8d76ac7a0a5d7943ed8145ad2152a7c3bbac2eeac1bdad779bf2225c4 +size 561078631 diff --git a/full_models/pau/G_100000.pth b/full_models/pau/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe6c8276fa742df65c5827857b1062685df5e2f9 --- /dev/null +++ b/full_models/pau/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34af65cdba27896e0be2b39e8e9ac8fe58a4cf93450cbe3e6113e3ec8c0caabf +size 436382877 diff --git a/full_models/pau/config.json b/full_models/pau/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pau/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pau/vocab.txt b/full_models/pau/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9450186ecc41ee684464e3558fd8a2725d6cb204 --- /dev/null +++ b/full_models/pau/vocab.txt @@ -0,0 +1,40 @@ +| +e +l +a +i +r +m +k +o +u +n +g +d +s +t +h +c +b +j +p +f +0 +y +v +' +x +4 +2 +- +1 +5 +9 +w +3 +7 +6 +— +8 +q + diff --git a/full_models/pbb/D_100000.pth b/full_models/pbb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6697d52f65a4a30efc8d966b37267c7f25cbed68 --- /dev/null +++ b/full_models/pbb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e23be90a9de85f6fd84b532d37faa71cf0d8faaee4bd0ec555d8e29e6662408 +size 561078590 diff --git a/full_models/pbb/G_100000.pth b/full_models/pbb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..53edfe12b063383b4f27311596a2cc32ccb7ec6e --- /dev/null +++ b/full_models/pbb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68a2e2ff8ddfbae07293840490ef1dcc4ba0cda194f31f51f0929a96c24e3d4 +size 436385193 diff --git a/full_models/pbb/config.json b/full_models/pbb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pbb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pbb/vocab.txt b/full_models/pbb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ddd6f0e1d9b6b802a5f17f4f347734d622548af0 --- /dev/null +++ b/full_models/pbb/vocab.txt @@ -0,0 +1,41 @@ +| +a +' +e +y +s +u +j +t +c +i +n +w +r +p +h +m +ã +v +d +ẽ +ũ +l +ĩ +g +o +á +q +f +z +é +b +í +— +ñ +- +ó +x +ú +k + diff --git a/full_models/pbc/D_100000.pth b/full_models/pbc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..732c4ea940fb69f0e086c77f298e0e7e77374f47 --- /dev/null +++ b/full_models/pbc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b660a3ad60a2a452b807901cf8ddc11cf6f0d8c5761c5e1d4c54b68bd1fd30b5 +size 561078733 diff --git a/full_models/pbc/G_100000.pth b/full_models/pbc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fda8fe0d3d845fd9c745110cb9bdc4ea6976b6e5 --- /dev/null +++ b/full_models/pbc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc4c6e015b184336660e10d09200e87e9cefa12cc273b4f248764a7e21d3430 +size 436390820 diff --git a/full_models/pbc/config.json b/full_models/pbc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pbc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pbc/vocab.txt b/full_models/pbc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..05b36ae929d81c4e78a5a490e16fe128490332a3 --- /dev/null +++ b/full_models/pbc/vocab.txt @@ -0,0 +1,42 @@ +| +a +k +p +n +e +o +t +à +i +l +ù +u +m +y +s +w +' +h +c +j +r +d +b +0 +g +1 +z +v +7 +2 +f +4 +5 +3 +6 +x +8 +9 +q +- + diff --git a/full_models/pbi/D_100000.pth b/full_models/pbi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b2ca9c915a3f522753bf3f91561636e3dd16e5f --- /dev/null +++ b/full_models/pbi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6654ecfbfedd4a86909e5bf7315cd2359c7fd3e9e37e060f84ba209f40c2fd0e +size 561078605 diff --git a/full_models/pbi/G_100000.pth b/full_models/pbi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a877a9f362f822e286dfc7146c60aae45bedcf53 --- /dev/null +++ b/full_models/pbi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fe4186c03f2472e61d9c4be864ba918d015178fe842525af1d39cb370ba303d +size 436373560 diff --git a/full_models/pbi/config.json b/full_models/pbi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pbi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pbi/vocab.txt b/full_models/pbi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b330cbb9d7498c9b3e212f5e94565e8fdfde223f --- /dev/null +++ b/full_models/pbi/vocab.txt @@ -0,0 +1,36 @@ +| +a +ə +k +n +d +m +l +t +e +i +s +w +ŋ +b +r +u +z +h +g +ɗ +y +v +ɨ +á +à +f +ɓ +́ +p +j +c +- +̌ +1 + diff --git a/full_models/pce/D_100000.pth b/full_models/pce/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9013b624d299d9959cb3b826b25459c119c20c6 --- /dev/null +++ b/full_models/pce/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb171f77443e070af14bd102915c11dc70af138461da8e6be344ee3825247fc +size 561078718 diff --git a/full_models/pce/G_100000.pth b/full_models/pce/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7332452bdbc642a6a02bad2b853ba69761dc6969 --- /dev/null +++ b/full_models/pce/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d005a762dc0fcc33ebb109f7324daa6f3bdeacceb4dd35d171c59661c5d3019f +size 436381264 diff --git a/full_models/pce/config.json b/full_models/pce/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pce/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pce/vocab.txt b/full_models/pce/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..583e1c2d201fae7d61188b56a083e9c9faeb1fe5 --- /dev/null +++ b/full_models/pce/vocab.txt @@ -0,0 +1,39 @@ +| +อ +า +ี +เ +ด +น +ม +ห +บ +ต +แ +ว +โ +ย +ึ +ั +ู +ง +ร +ก +ฆ +ซ +ป +ฮ +ล +ะ +ฌ +ค +ณ +็ +พ +ื +จ +ท +ช +' +ฟ + diff --git a/full_models/pcm/D_100000.pth b/full_models/pcm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5920a5c2278449241ba8a15858b0c9a2eed767b2 --- /dev/null +++ b/full_models/pcm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b49d2529ee57f9482723657094107d772b642856f327f6e2adc4766e32b2a8 +size 561078480 diff --git a/full_models/pcm/G_100000.pth b/full_models/pcm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5df547b2c53a61b11d633d8fe532c1a3a3c7cc7d --- /dev/null +++ b/full_models/pcm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f411345bfb7598448e42b1d436dd5185e7fa90d657a8f35f97a78515fa230e0f +size 436373668 diff --git a/full_models/pcm/config.json b/full_models/pcm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pcm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pcm/vocab.txt b/full_models/pcm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4e87d6371c0753ba66d09ce6ddb1ebe7537e656c --- /dev/null +++ b/full_models/pcm/vocab.txt @@ -0,0 +1,36 @@ +| +e +o +a +i +n +d +s +t +r +y +l +m +w +k +u +g +p +f +b +h +v +c +j +- +z +x +0 +' +1 +2 +5 +4 +7 +3 + diff --git a/full_models/peg/D_100000.pth b/full_models/peg/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..e90756eb3c3214844675a1b04eb28687a091c412 --- /dev/null +++ b/full_models/peg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0929c65c62b710c3ca97ca06adb23dc5868c7233092d0841318bf403aca32f8 +size 561076025 diff --git a/full_models/peg/G_100000.pth b/full_models/peg/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d1659e2210bd012209efa1bd9ab35ecce7dffc1c --- /dev/null +++ b/full_models/peg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99a65f8606bc4ec1b933264e313855563498bba8582183a756876bcad487357 +size 436359085 diff --git a/full_models/peg/config.json b/full_models/peg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/peg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/peg/vocab.txt b/full_models/peg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f49a5ab790d5f783002eca7f6b3c8869b089e78b --- /dev/null +++ b/full_models/peg/vocab.txt @@ -0,0 +1,38 @@ +| +ା +୍ +ି +େ +ର +ନ +ତ +କ +ହ +ଜ +ୱ +ୁ +ଗ +ମ +ଂ +ଇ +ଆ +ସ +ଦ +ପ +ବ +଼ +ଚ +ଲ +ଡ +ଙ +ୟ +ଣ +ଟ +ଏ +‍ +ଞ +ଉ +ଅ +ଓ +ଃ + diff --git a/full_models/pez/D_100000.pth b/full_models/pez/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c92e3f981ebf5688c1d151a18216cee10256314 --- /dev/null +++ b/full_models/pez/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc938fb2952cfe83e391a8d877402a7ad45e8877ff4a2b156cde0492c6707ca +size 561078349 diff --git a/full_models/pez/G_100000.pth b/full_models/pez/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8eb66a63031fbd38d1cb09d6c61af5f8d4cb6da5 --- /dev/null +++ b/full_models/pez/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:260635ff6d750e91399574f0997318ab3a9706794f9da65dcf9ea4225909284a +size 436362051 diff --git a/full_models/pez/config.json b/full_models/pez/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pez/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pez/vocab.txt b/full_models/pez/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..562d5b726d75627886aaa793ffc7261f13b6c20a --- /dev/null +++ b/full_models/pez/vocab.txt @@ -0,0 +1,33 @@ +b +h +p +_ +- +g +l +0 +c +2 +u +n +o +6 + +a +j +i +e +v +1 +w +s +é +r +k +m +4 +y +z +d +t +' diff --git a/full_models/pib/D_100000.pth b/full_models/pib/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49746aae74c0cccd90d55c6eaf497e0ab52d6af8 --- /dev/null +++ b/full_models/pib/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69cd9e9714ba6aca6477904f067c1093a8fa8bcb268faa784c728a6f8acd82c3 +size 561078232 diff --git a/full_models/pib/G_100000.pth b/full_models/pib/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..41f985b5e68209f7535d70f7703af3b7c9a69f1d --- /dev/null +++ b/full_models/pib/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b4b838fcc5dd7df918106b5a71500d567ada418f0023fd6eb2223a339dce20 +size 436342989 diff --git a/full_models/pib/config.json b/full_models/pib/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pib/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pib/vocab.txt b/full_models/pib/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..30f406e6f3a1c0304b8bfe7543d74a3cfd271b4e --- /dev/null +++ b/full_models/pib/vocab.txt @@ -0,0 +1,24 @@ +u +j +— +s +n +l +r +e +t +' +k +c +x + +m +a +g +y +p +w +o +i +_ +h diff --git a/full_models/pil/D_100000.pth b/full_models/pil/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d549663fe9a3ae8167fbe0f1a88a2b0562ff0c4 --- /dev/null +++ b/full_models/pil/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b3c136b0cb6d1abdaf5e700bebad533782f37aab24eb1a22a451557e0dec98 +size 561078627 diff --git a/full_models/pil/G_100000.pth b/full_models/pil/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d5b59d2d51bde46a4fc11109a1bdb0d3c9773c34 --- /dev/null +++ b/full_models/pil/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2022cf67135de47be6f02fc4aba73c35d8900046d80f7513a3cbefbe7b4e4271 +size 436382796 diff --git a/full_models/pil/config.json b/full_models/pil/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pil/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pil/vocab.txt b/full_models/pil/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9a699ac5028709ffbe97a3946620c9b0ebbe22a9 --- /dev/null +++ b/full_models/pil/vocab.txt @@ -0,0 +1,40 @@ + +w +ò +f +t +d +v +p +u +g +- +ɛ +z +ə +n +à +c +r +ì +è +ʋ +k +ɣ +b +ɔ +h +̀ +m +l +y +e +i +_ +j +ǝ +o +s +ŋ +a +ù diff --git a/full_models/pir/D_100000.pth b/full_models/pir/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e9b9a1b5a89fabdb8f2c0e1d89a6f20f49149c64 --- /dev/null +++ b/full_models/pir/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7016c7abc92b250186ff518f47ac4cd202e1e7135a9cd24c3b845a44d7fd083 +size 561076930 diff --git a/full_models/pir/G_100000.pth b/full_models/pir/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3b7275162cf14ce7c3de6eaa68374112c7b730ef --- /dev/null +++ b/full_models/pir/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebbd3eb27820c5e30bb3ba445fe489191dcc58dd585882deb7bdaacadf79628 +size 436391857 diff --git a/full_models/pir/config.json b/full_models/pir/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pir/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pir/vocab.txt b/full_models/pir/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..19d8e8deb2a1b664fd02bba1cee175ea9f25684e --- /dev/null +++ b/full_models/pir/vocab.txt @@ -0,0 +1,44 @@ +| +a +i +e +r +o +h +ʉ +u +t +n +y +s +c +q +m +j +p +d +̃ +g +ñ +ã +b +w +ẽ +ũ +l +õ +ĩ +— +í +f +v +é +z +á +ú +' +ó +k +x +́ + diff --git a/full_models/pis/D_100000.pth b/full_models/pis/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..031c81a61cbf8f33739b53d5f714c18b460b0dec --- /dev/null +++ b/full_models/pis/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa05484733aebbde0cda14e9d6b9acc09ad5a75ae11c737279af6f3655541fb +size 561078632 diff --git a/full_models/pis/G_100000.pth b/full_models/pis/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d693e3e8554c9f0d47f207bdc173465aa9ff4b93 --- /dev/null +++ b/full_models/pis/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00ec5e879c455ac125a510fba6e27c0e18fb1a4c4253b54c10394e8d8cff1f2 +size 436373669 diff --git a/full_models/pis/config.json b/full_models/pis/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pis/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pis/vocab.txt b/full_models/pis/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..36fcd317e4e247b05c236c2f4fd91d13a1bb212d --- /dev/null +++ b/full_models/pis/vocab.txt @@ -0,0 +1,36 @@ +| +a +e +o +m +i +n +l +t +s +g +k +f +h +u +b +d +r +p +y +w +v +j +- +0 +' +1 +2 +4 +9 +5 +6 +3 +7 +8 + diff --git a/full_models/pjt/D_100000.pth b/full_models/pjt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..47c6c803d9767d83d7076219bf745445d62bbcc5 --- /dev/null +++ b/full_models/pjt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80757041e1f58cc85a57c409e653821d88db5a7fea44a29db8b78625fea96725 +size 561076197 diff --git a/full_models/pjt/G_100000.pth b/full_models/pjt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eaa947cb829052ffac7ae6b002249829e3a6e9eb --- /dev/null +++ b/full_models/pjt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfe553901d50c35a71730d2165daba20439c58dd8362d8b36e2cdc4448c5ad5 +size 436376358 diff --git a/full_models/pjt/config.json b/full_models/pjt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pjt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pjt/vocab.txt b/full_models/pjt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9a71741b676d501f9f79b7b879a268d154c82130 --- /dev/null +++ b/full_models/pjt/vocab.txt @@ -0,0 +1,45 @@ +y +d +m +v +c +z +6 +ḻ +4 +— +b +_ +p +' +3 +ṟ +ṉ +9 +5 +– +s +w +8 +h +l +o +g +x +1 +u +- +n +f +ṯ +r + +2 +0 +e +j +t +7 +i +k +a diff --git a/full_models/pkb/D_100000.pth b/full_models/pkb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5b36681d93b8e488be505dd408b20dbdb1b822af --- /dev/null +++ b/full_models/pkb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6b5f493ea2a5b3971166a99beafe076eb2da887277040bfaaa1e4d8e417778 +size 561078625 diff --git a/full_models/pkb/G_100000.pth b/full_models/pkb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3378b1ef9986a7074d72ab9f5a1e76922597eb44 --- /dev/null +++ b/full_models/pkb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90537fb46d108b4c6f9d160083d1ebf3112cdd56a57f94651a790f72a2f66db +size 436371134 diff --git a/full_models/pkb/config.json b/full_models/pkb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pkb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pkb/vocab.txt b/full_models/pkb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..751869886f7702197f62c706225139929fe8c9cf --- /dev/null +++ b/full_models/pkb/vocab.txt @@ -0,0 +1,35 @@ +a +| +u +i +n +w +e +k +m +y +o +h +s +d +z +t +g +b +̯ +r +v +f +j +l +p +ḍ +c +ḅ +- +0 +1 +4 +2 +' + diff --git a/full_models/pls/D_100000.pth b/full_models/pls/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..acbff883a06d1131f47b14adc07f57affca4c7cc --- /dev/null +++ b/full_models/pls/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f8841cbe43d109f91178e6feae6a43311e05b25fb1ea6a33a4dbe9c8e470d4 +size 561079376 diff --git a/full_models/pls/G_100000.pth b/full_models/pls/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6420cac6f183b892a88c0655114b2a54889a3bd1 --- /dev/null +++ b/full_models/pls/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a23997864398e74556db5b307a92c3f6afa2b7ec02fe7b3b9b5ace61b5be67f +size 436398846 diff --git a/full_models/pls/config.json b/full_models/pls/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pls/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pls/vocab.txt b/full_models/pls/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2c8d8a794cc12a09a0e3f0a930f4165832d93b68 --- /dev/null +++ b/full_models/pls/vocab.txt @@ -0,0 +1,45 @@ +7 + +a +6 +4 +t +m +l +s +e +k +- +q +_ +x +b +ꞌ +' +3 +1 +ú +r +z +g +p +v +d +o +u +̱ +í +0 +i +f +ó +y +h +é +c +n +2 +— +ñ +á +j diff --git a/full_models/plw/D_100000.pth b/full_models/plw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ee0742d6ded126c8d262fab08ae988613bbffe47 --- /dev/null +++ b/full_models/plw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ad1174794319d19fae5336a592d18194b3841f16267ed8d3c1f3eca98479ab +size 561079024 diff --git a/full_models/plw/G_100000.pth b/full_models/plw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fb56641d413ecc524d52f97ec3d3cb3051d09ff8 --- /dev/null +++ b/full_models/plw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b605a260323ad925e648942d54a24592e4b1129734cfa0584efa539957e4c043 +size 436365600 diff --git a/full_models/plw/config.json b/full_models/plw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/plw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/plw/vocab.txt b/full_models/plw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4cc9696828e3841fdfb4f8cc567e7f6853526ec9 --- /dev/null +++ b/full_models/plw/vocab.txt @@ -0,0 +1,31 @@ +i +a +3 +t +6 +ʼ +' + +4 +p +1 +- +w +h +n +k +u +y +r +2 +d +g +b +s +e +m +j +_ +l +0 +o diff --git a/full_models/pmf/D_100000.pth b/full_models/pmf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..11e5107cca8b092e45ba6732ce3450f585ca6e62 --- /dev/null +++ b/full_models/pmf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b568425ab8dcf7795a4269e7a3d27bb4b61f91d8117cb5bbd3cf991e50afb2 +size 561076184 diff --git a/full_models/pmf/G_100000.pth b/full_models/pmf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..91654d79e55787647368d2244ec3ee9fded48ba9 --- /dev/null +++ b/full_models/pmf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224980d4b55ae2b2e04e3c5db8c4fda4768efc36c16c5e0254e01fa238dccfac +size 436335269 diff --git a/full_models/pmf/config.json b/full_models/pmf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pmf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pmf/vocab.txt b/full_models/pmf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6386f1baecd988aa572c141acaef4895a1179a1e --- /dev/null +++ b/full_models/pmf/vocab.txt @@ -0,0 +1,27 @@ +a +| +o +i +n +m +e +t +u +k +s +p +r +g +l +y +w +' +b +d +j +h +- +z +c +f + diff --git a/full_models/pny/D_100000.pth b/full_models/pny/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b54570300b808eb96c93fd579eae58065d15cc3 --- /dev/null +++ b/full_models/pny/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86bb4622c878ea0c49d83c38a669b2fb19d6ecdcc700768e97fc7d2225a027cb +size 561078624 diff --git a/full_models/pny/G_100000.pth b/full_models/pny/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..fbb1cd99edd70fd91135e6fca0e9e691bc35e929 --- /dev/null +++ b/full_models/pny/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e935b9c9f403d848a75f7487b4ee269a7136960c2c93e366b3af0181fd45ab5e +size 436417343 diff --git a/full_models/pny/config.json b/full_models/pny/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pny/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pny/vocab.txt b/full_models/pny/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f061ca8f2138a31cb3a97c30c46140faa44a9e57 --- /dev/null +++ b/full_models/pny/vocab.txt @@ -0,0 +1,55 @@ +| +ə +̀ +n +ɨ +a +m +p +à +t +w +l +h +o +ŋ +u +b +s +ù +ʼ +g +k +y +i +r +z +e +ò +ẅ +d +̂ +è +f +ì +c +â +ô +ǎ +j +û +ě +̌ +ǹ +ǔ +î +ǐ +v +' +ǒ +x +q +- +1 +2 + diff --git a/full_models/poh-dialect_eastern/D_100000.pth b/full_models/poh-dialect_eastern/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..71b8b0f22336a74c534f50953a7c771548e37de0 --- /dev/null +++ b/full_models/poh-dialect_eastern/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6c41d50a52f1aa1b0ad96a23ed9ac33cc563bfbe4e8b10b7fff1679c2698e4 +size 561076199 diff --git a/full_models/poh-dialect_eastern/G_100000.pth b/full_models/poh-dialect_eastern/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..95321c10c15b49cade98f422f14499d70640f2af --- /dev/null +++ b/full_models/poh-dialect_eastern/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e16d512a37e38413f95ecc9b0cced7fcb5baa9df401feb0caefbeeeaf1e7db +size 436358196 diff --git a/full_models/poh-dialect_eastern/config.json b/full_models/poh-dialect_eastern/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/poh-dialect_eastern/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/poh-dialect_eastern/vocab.txt b/full_models/poh-dialect_eastern/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9c3ba23ee9b6e350b1659430710048d09b5d0823 --- /dev/null +++ b/full_models/poh-dialect_eastern/vocab.txt @@ -0,0 +1,37 @@ +h +e +p +ó +á +ú +— + +y +_ +l +a +r +u +b +í +f +' +m +v +g +w +é +q +z +- +j +k +i +s +ñ +c +d +x +t +o +n diff --git a/full_models/poh-dialect_western/D_100000.pth b/full_models/poh-dialect_western/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3817adf36436223b043f18ea62b9c45dd5d710a --- /dev/null +++ b/full_models/poh-dialect_western/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91bd9ca4cb2afb70127cb8a05645bccb966e5022fa3369d5c8cad72fd6bc5312 +size 561076159 diff --git a/full_models/poh-dialect_western/G_100000.pth b/full_models/poh-dialect_western/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2cf647587de99fcee608483af0f90b14ef60e42e --- /dev/null +++ b/full_models/poh-dialect_western/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc3da13bcb1cd95b8eeda973544150c81e7b2d248b087df0779d01d3f276cb9c +size 436339008 diff --git a/full_models/poh-dialect_western/config.json b/full_models/poh-dialect_western/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/poh-dialect_western/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/poh-dialect_western/vocab.txt b/full_models/poh-dialect_western/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..20b5816d3a187c5934879750db24ae9321b9ffb8 --- /dev/null +++ b/full_models/poh-dialect_western/vocab.txt @@ -0,0 +1,29 @@ +| +i +a +ꞌ +c +h +e +r +n +o +j +k +u +l +t +w +̱ +m +b +x +s +q +p +y +d +- +z +— + diff --git a/full_models/poi/D_100000.pth b/full_models/poi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1be8d88853623b981a0e6d63ff6dccb2ed3802fa --- /dev/null +++ b/full_models/poi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f33f403d4550c81b8112e356cedb46a172180cbf905be6953d57138a325c989 +size 561078078 diff --git a/full_models/poi/G_100000.pth b/full_models/poi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa1606d47d5609ae1e6faa7b520aa8ad0cdd88c9 --- /dev/null +++ b/full_models/poi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628d6430eee95fac3b4e679cac785a32c121357519c696e6bcf7468f0a002c5d +size 436375804 diff --git a/full_models/poi/config.json b/full_models/poi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/poi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/poi/vocab.txt b/full_models/poi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cf9f9ce431e65ca7cc4ee2a15a1df82a25b44225 --- /dev/null +++ b/full_models/poi/vocab.txt @@ -0,0 +1,39 @@ +ñ +e +q +r +i +w +x +́ +é +f +_ +b +k +a +̱ + +v +g +d +s +o +y +á +p +m +í +ŋ +l +ó +n +ú +j +z +- +t +ɨ +c +h +u diff --git a/full_models/pol/D_100000.pth b/full_models/pol/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..16026a7c6079539846be1c710eac22f88bcb327d --- /dev/null +++ b/full_models/pol/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb88d69da204287cf7e3a417a5c65ba30766f94c4dd151b708373bd1c359b8a5 +size 561078992 diff --git a/full_models/pol/G_100000.pth b/full_models/pol/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..b56300ef72d9c4d316e18af8a9f597701a134cd8 --- /dev/null +++ b/full_models/pol/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fc25fbe85a53fd1255e29d1b9716f36b9c5fab27f98ca3d351aa9fe6d11aeb +size 436400472 diff --git a/full_models/pol/config.json b/full_models/pol/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pol/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pol/vocab.txt b/full_models/pol/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ae470fc39a84be58abbf33aca29a961071b2cd7a --- /dev/null +++ b/full_models/pol/vocab.txt @@ -0,0 +1,46 @@ +w +h + +l +0 +c +m +ą +s +z +u +d +2 +ń +ó +4 +g +f +1 +p +9 +— +e +6 +- +k +b +8 +r +a +5 +_ +ę +y +ł +i +ż +j +o +3 +7 +n +t +ś +ć +ź diff --git a/full_models/por/D_100000.pth b/full_models/por/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..199fb8dc5b411e6b6a6673be30db165909c09f2b --- /dev/null +++ b/full_models/por/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06704db25aef03b34f499deaa345f34331c61f2642d53f207baca0d7ba283547 +size 561110491 diff --git a/full_models/por/G_100000.pth b/full_models/por/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e5c9ea8a5a53e08773eb8acd062b1673c82f1585 --- /dev/null +++ b/full_models/por/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffd5451f584644f405377b181f1eba19fcddf081a4fee6dd5e691ec7e2a08dcd +size 436631920 diff --git a/full_models/por/config.json b/full_models/por/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/por/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/por/vocab.txt b/full_models/por/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..31889ac32737d53b54aa138b481be6befe6d4bd8 --- /dev/null +++ b/full_models/por/vocab.txt @@ -0,0 +1,43 @@ +à +ú +1 +u +l +2 +h +é +p +ã +x +' +ê +_ +s +ç +4 +v +m +- +g +q +c +z +â +í +t +e +o +i +f +b + +r +ô +n +— +ó +a +j +d +õ +á diff --git a/full_models/poy/D_100000.pth b/full_models/poy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67a7c6ac496f99d8b26fa854ef1965136db301c9 --- /dev/null +++ b/full_models/poy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f96a2490bf3b89d326f4ebde385d1971657d8bbe7333fde54d4728c357a65be +size 561079129 diff --git a/full_models/poy/G_100000.pth b/full_models/poy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1b2795b5724e3d6d0be1f15ca6247ed519e0b76e --- /dev/null +++ b/full_models/poy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5865a6c3d19230fa95c6515a101d52bc8f0252ee8faa764b4cd0f7bfe637b6cc +size 436357407 diff --git a/full_models/poy/config.json b/full_models/poy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/poy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/poy/vocab.txt b/full_models/poy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc45d57877c52dbc2a9a7317b630fe51df900504 --- /dev/null +++ b/full_models/poy/vocab.txt @@ -0,0 +1,27 @@ +u +a +' +t +p +g +n +e +k +y +z +s +_ +f + +r +l +v +i +j +b +m +h +o +c +w +d diff --git a/full_models/ppk/D_100000.pth b/full_models/ppk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..19adb624a774135df04c088d9925e3609ab7da77 --- /dev/null +++ b/full_models/ppk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b397854e5450a6d14cf0a66ac9e526706b18e3c7cdc6be8f7f7c50c742b7a0e +size 561079090 diff --git a/full_models/ppk/G_100000.pth b/full_models/ppk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..202362b6196b3d9b52e4ac034909ca0289f3866c --- /dev/null +++ b/full_models/ppk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac42e76a983d13e23d13c18d3119b0f421f2fa97af7498a092bee03270d283ca +size 436358387 diff --git a/full_models/ppk/config.json b/full_models/ppk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ppk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ppk/vocab.txt b/full_models/ppk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3c1681b9963f8893d213c87875802b4cec4e1e34 --- /dev/null +++ b/full_models/ppk/vocab.txt @@ -0,0 +1,28 @@ +u +c +_ +y +a +e +s +d +l +b +p +k +f +r +i +t +o +j +g +m + +- +z +– +h +n +w +' diff --git a/full_models/pps/D_100000.pth b/full_models/pps/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..90b9b0e556c87df84b11713d04b9509ea7cc2cf6 --- /dev/null +++ b/full_models/pps/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54ad0cf562d38b6d1ad85b408862f77df1cfd46acd3f87810f095e46bb6b59a +size 561079381 diff --git a/full_models/pps/G_100000.pth b/full_models/pps/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..72cf5c9bfd9cee6d4f020c736d67948bff3e067f --- /dev/null +++ b/full_models/pps/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e26cbf22c15387797e1317587abe0262e1fa9fdb79098367618c1874dbbb85f +size 436401027 diff --git a/full_models/pps/config.json b/full_models/pps/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pps/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pps/vocab.txt b/full_models/pps/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f8e8bd17606dc09de49e1614cb97c7acf5add74f --- /dev/null +++ b/full_models/pps/vocab.txt @@ -0,0 +1,46 @@ +o +' +j +r +1 +t +_ +x +ó +ì +d +` +m +g +i +ú +à +h +u +n + +p +e +9 +l +— +c +ꞌ +k +f +q +ñ +s +z +y +- +b +2 +̱ +í +5 +a +á +v +ù +é diff --git a/full_models/prf/D_100000.pth b/full_models/prf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b53bb27c04daa1265268e3920171ce2df80abf3 --- /dev/null +++ b/full_models/prf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ff6aa2a7960ea5259b8dff76e93f59bce38e1f6b40c6771b181748e900c141 +size 561078625 diff --git a/full_models/prf/G_100000.pth b/full_models/prf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c6c19dce90d9d3e1ac2a5da6226363859d4e8eb0 --- /dev/null +++ b/full_models/prf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f5bedf79a409d1ea45be329773e5dd87d708bf36ed01b4b8793dc7466f95d2 +size 436373683 diff --git a/full_models/prf/config.json b/full_models/prf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/prf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/prf/vocab.txt b/full_models/prf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8dc53454c09f3fe3fe1198df7053dc40ecd204d1 --- /dev/null +++ b/full_models/prf/vocab.txt @@ -0,0 +1,36 @@ +| +a +n +i +t +k +e +u +d +y +m +g +s +p +l +o +á +b +h +r +w +j +- +c +' +f +z +v +q +0 +1 +2 +x +4 +6 + diff --git a/full_models/prk/D_100000.pth b/full_models/prk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c67d33912d0715c07c784e82a3474d137d78220c --- /dev/null +++ b/full_models/prk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e3fb454cc96ed36f3fa184fac0dc1e0824001a75a23f091cb0aa7cd38389d1 +size 561079234 diff --git a/full_models/prk/G_100000.pth b/full_models/prk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ed3dfeffd37fa1e785db721486dacc71f58197d --- /dev/null +++ b/full_models/prk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403f86713cce56e459faf84f8991eef4341f384b88b2742adc6aeb92603afe00 +size 436369475 diff --git a/full_models/prk/config.json b/full_models/prk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/prk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/prk/vocab.txt b/full_models/prk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cbac670720ee1a7b7cdd5c2f823319c9b2f1811f --- /dev/null +++ b/full_models/prk/vocab.txt @@ -0,0 +1,32 @@ +r +j +d +p +h +k +w +- +t +i +6 +e +u +9 +2 +s +n +o +a + +_ +l +m +c +y +v +f +g +x +z +4 +b diff --git a/full_models/prt/D_100000.pth b/full_models/prt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c9499211977cb04f7f567122de9f46ca2f65fef --- /dev/null +++ b/full_models/prt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca179a74743fa53f44b4a2b92fba98cd94e1b6f973b089fb525c65f61a7e8076 +size 561078503 diff --git a/full_models/prt/G_100000.pth b/full_models/prt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c1aae01c33943fb133c0d953778d87e5da91c0a2 --- /dev/null +++ b/full_models/prt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b41ca6a617e8c35ca7c47e1c9457106e4754f347b3b7e8e46a2c22ba321fa8 +size 436417223 diff --git a/full_models/prt/config.json b/full_models/prt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/prt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/prt/vocab.txt b/full_models/prt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..437d201f11798cfd9b853e20ee74af5bfcdc28ba --- /dev/null +++ b/full_models/prt/vocab.txt @@ -0,0 +1,55 @@ +1 +6 +้ +_ +‍ +ร +ญ +อ +ั +ป +พ +ื +น +จ +ฟ +ค +ท +ุ +บ +ไ +ว +0 +ใ +แ +ง +3 +5 +๊ +ะ +ย +9 +4 +า +ี +ก +ฮ +ห +ต + +ิ +ู +็ +ด +8 +ึ +เ +2 +7 +- +ํ +' +ล +โ +ซ +ม diff --git a/full_models/pse/D_100000.pth b/full_models/pse/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb52acf6060dafe29e99ed3a73134b5d2c7c9237 --- /dev/null +++ b/full_models/pse/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908ac850904303bcddc54d6638e2bfa7bd151a42e8a9b12d10e496d2dc5de0d2 +size 561079130 diff --git a/full_models/pse/G_100000.pth b/full_models/pse/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6184caa470fe55114b8b529350f95edc8d02ab0c --- /dev/null +++ b/full_models/pse/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eaf893149e2709f2455439e64044aea21be355bf9cefd8a2178b9c91e316e89 +size 436350344 diff --git a/full_models/pse/config.json b/full_models/pse/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pse/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pse/vocab.txt b/full_models/pse/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1eee4de7a8322e21ae66548486e90082d3a091f2 --- /dev/null +++ b/full_models/pse/vocab.txt @@ -0,0 +1,24 @@ +h +d +j +g +b +i +- +n +c +w +p +' +m +e +a +k +s + +u +r +y +_ +l +t diff --git a/full_models/pss/D_100000.pth b/full_models/pss/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fd697b15b4becd54b41f083ca11b8edd38b2abfa --- /dev/null +++ b/full_models/pss/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:342163bceac8c896ccc625078a800f489f5c22f01e27461b0e45634636e44de2 +size 561078768 diff --git a/full_models/pss/G_100000.pth b/full_models/pss/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3526fb4d24e2a590d961631bdade58bb87e7bcb9 --- /dev/null +++ b/full_models/pss/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8a9cdae3f164f1e6b4217959c4ca0640e5ef280c4fbf2e45758a89457fa348a +size 436348153 diff --git a/full_models/pss/config.json b/full_models/pss/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pss/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pss/vocab.txt b/full_models/pss/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a2824824c78a21736211c471202f96dacb7a6773 --- /dev/null +++ b/full_models/pss/vocab.txt @@ -0,0 +1,24 @@ +g +t +a +p +o +u +y +n +k +' +s +h +l +d +m +e +– +- +r + +i +w +b +_ diff --git a/full_models/ptu/D_100000.pth b/full_models/ptu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4909ec8072a3992690c381d23760651af95a21ec --- /dev/null +++ b/full_models/ptu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63e835560fde89f6a4bdd3497952cbd1a0f643a0945a8f032635044f9ad62fe +size 561078584 diff --git a/full_models/ptu/G_100000.pth b/full_models/ptu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7a4a9e9c42e14fd9fdeb5e96097221f5a3a8cae0 --- /dev/null +++ b/full_models/ptu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d70846de0cd6a284239ab66f67954c39c66f2a43dfc34f341b93dd5b6b9c6969 +size 436355229 diff --git a/full_models/ptu/config.json b/full_models/ptu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ptu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ptu/vocab.txt b/full_models/ptu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..81bfdd3534ff1d9c4e5a0ff92d43f50c62c001e9 --- /dev/null +++ b/full_models/ptu/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +i +u +m +l +o +t +s +' +k +e +p +d +g +b +h +ä +y +- +r +j +w +f +z +c + diff --git a/full_models/pui/D_100000.pth b/full_models/pui/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2c4b879b664f45250806bc81d3006735d0a2056 --- /dev/null +++ b/full_models/pui/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc14da8b65c047a1ec87c2d5f272b668b1542bca76b13ee23d0adf432db1765 +size 561079093 diff --git a/full_models/pui/G_100000.pth b/full_models/pui/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..95479e821264ecabe2eeaa5af781dd94e3e1a7ee --- /dev/null +++ b/full_models/pui/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6496588bd4fb86fed6a330c01adfe11ccf8b59e88b7763f6e772b961d9e85d +size 436392561 diff --git a/full_models/pui/config.json b/full_models/pui/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pui/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pui/vocab.txt b/full_models/pui/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c28dfad4f2ea9e3b11a78e743fc28b5528722fef --- /dev/null +++ b/full_models/pui/vocab.txt @@ -0,0 +1,42 @@ +í +0 +ü +á +m +_ +n +d +x +ó +p +a +k +2 +h +j +y +l +b +ú +t +v +ñ +é +ŕ +z +o +w +q +- +4 +e +7 + +i +u +f +c +g +9 +s +r diff --git a/full_models/pwg/D_100000.pth b/full_models/pwg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b13f8e430ffe0d0a111f25390e9f886fc11b670 --- /dev/null +++ b/full_models/pwg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac834084a971a1bfa8ef6c91c30490be9b5340c9d1fb700c522536daeee43f4 +size 561078366 diff --git a/full_models/pwg/G_100000.pth b/full_models/pwg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..98606eacfa0f72c2f3909f87187114db2fddae48 --- /dev/null +++ b/full_models/pwg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09a3d6cd153b4217b249a6460341d267ed86ffdc5f8afbe53888107354c29c4 +size 436378057 diff --git a/full_models/pwg/config.json b/full_models/pwg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pwg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pwg/vocab.txt b/full_models/pwg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a690f3136627040906d2317ad88a6d61c3528d16 --- /dev/null +++ b/full_models/pwg/vocab.txt @@ -0,0 +1,38 @@ +s +4 +b +e +x +7 +1 +' +d +p +c +9 +6 +w +h +0 +j +u +m + +3 +n +_ +5 +y +t +f +r +g +k +l +8 +v +o +z +i +a +2 diff --git a/full_models/pww/D_100000.pth b/full_models/pww/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..034e3b82c801bb6e3e1127cf0e2ab159d9ffa0b1 --- /dev/null +++ b/full_models/pww/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f7ff25f6c68589b0bc332cbea8568402e7dc183ded7fe4b9a4488cebbe4e4b +size 561078577 diff --git a/full_models/pww/G_100000.pth b/full_models/pww/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..000d55cbce332ddd998664f42696b165a292d8d5 --- /dev/null +++ b/full_models/pww/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9ec52e05bc4c30a3aca07d10911f6ca3e2a04614f018c544d7c620af4c6bbd +size 436396722 diff --git a/full_models/pww/config.json b/full_models/pww/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pww/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pww/vocab.txt b/full_models/pww/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c86d694873312bca0a73c72f885e3d91e770a467 --- /dev/null +++ b/full_models/pww/vocab.txt @@ -0,0 +1,46 @@ +| +้ +ง +อ +ล +เ +แ +่ +๊ +ี +า +ะ +น +ท +พ +ม +ซ +ก +โ +ว +ู +บ +ฌ +ด +ย +ไ +ค +ช +จ +ื +ุ +ฆ +ิ +- +ึ +ป +ต +ร +ฮ +' +ฟ +ั +1 +ส +ผ + diff --git a/full_models/pxm/D_100000.pth b/full_models/pxm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9c02af46c47d704f01331ca8ad7c6d97d5f5be78 --- /dev/null +++ b/full_models/pxm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c0162370e418dd0b55067933035e8b0d668482fcbc14b0039eec9ab48696fd +size 561078093 diff --git a/full_models/pxm/G_100000.pth b/full_models/pxm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9122b1f490966acaa4f2d6e842d8b9582e8e97d --- /dev/null +++ b/full_models/pxm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8c60dd91483029ab18fe6e1d92fb96b6b85ed2f2aa4209ff24f6e4b74693b7 +size 436372216 diff --git a/full_models/pxm/config.json b/full_models/pxm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/pxm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/pxm/vocab.txt b/full_models/pxm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..48f736ccf3ca08681bc6a7baf08db7081bdd160e --- /dev/null +++ b/full_models/pxm/vocab.txt @@ -0,0 +1,37 @@ +n +e +g +t +w +h +m +l +b +k +_ +o +j +x +d +v +á +ó +f +é +u +í +ú +ñ +z + +c +' +s +ë +p +a +ä +i +y +q +r diff --git a/full_models/qub/D_100000.pth b/full_models/qub/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..036693905de963caec801e7fab6fb721f11fd189 --- /dev/null +++ b/full_models/qub/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed4459a9e919ed299012df77d9ba3ccb49b9a0c14071bdc53872dbcaec115cc +size 561078619 diff --git a/full_models/qub/G_100000.pth b/full_models/qub/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cfc15abe3bcaca02b8a28e644ba0037e8ae4719a --- /dev/null +++ b/full_models/qub/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04998dc24c76796b3fc9e8e5144527bc84b1fd7013bfe67690864c133f923440 +size 436385337 diff --git a/full_models/qub/config.json b/full_models/qub/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qub/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qub/vocab.txt b/full_models/qub/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cecd43b47d3cf442ae6ea5779977db34119fad71 --- /dev/null +++ b/full_models/qub/vocab.txt @@ -0,0 +1,41 @@ +a +| +n +c +i +u +h +y +s +r +m +t +p +l +j +g +o +w +ä +e +q +d +ö +b +ñ +ï +ë +- +f +ú +ü +í +é +z +v +ó +á +' +x +k + diff --git a/full_models/quc-dialect_central/D_100000.pth b/full_models/quc-dialect_central/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3950e95eeb1f5d858fa53a2d733cf600d3dcf8f7 --- /dev/null +++ b/full_models/quc-dialect_central/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108b0a6014fc0da816e4d629b6053e0d78d76f662f0abc31f52a24357a7359ca +size 561077736 diff --git a/full_models/quc-dialect_central/G_100000.pth b/full_models/quc-dialect_central/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cd78f741cbd50985de763605e15fb1ff29619acf --- /dev/null +++ b/full_models/quc-dialect_central/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a67488377a157d9e4c19d8e6e2aec91923aa8accdc1eb08b9c45ac5fd1a7a5 +size 436365933 diff --git a/full_models/quc-dialect_central/config.json b/full_models/quc-dialect_central/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quc-dialect_central/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quc-dialect_central/vocab.txt b/full_models/quc-dialect_central/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d943b3558ab17879eec4ff4ad633a879e5a5070e --- /dev/null +++ b/full_models/quc-dialect_central/vocab.txt @@ -0,0 +1,37 @@ +| +i +a +c +r +u +e +ꞌ +j +n +h +t +o +l +k +x +m +w +b +s +q +ä +p +z +d +y +— +ú +í +g +é +á +ó +v +f +ñ + diff --git a/full_models/quc-dialect_east/D_100000.pth b/full_models/quc-dialect_east/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..40fefb43a5961efa698f3385630442235d731112 --- /dev/null +++ b/full_models/quc-dialect_east/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57567ac3f1f08c462c784bc2434d7911e75442ec1fa57ab1679b66d353e33535 +size 561078628 diff --git a/full_models/quc-dialect_east/G_100000.pth b/full_models/quc-dialect_east/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..453a2386b5b8930708ead027801dcf6e1321fcd0 --- /dev/null +++ b/full_models/quc-dialect_east/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa0c57d85a1d218fff1dd67815eef60736a39a5c7df53247ab0c60558b3fe14 +size 436391836 diff --git a/full_models/quc-dialect_east/config.json b/full_models/quc-dialect_east/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quc-dialect_east/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quc-dialect_east/vocab.txt b/full_models/quc-dialect_east/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3dea07a59512f3316b097b4fea9f1f018dbb89bf --- /dev/null +++ b/full_models/quc-dialect_east/vocab.txt @@ -0,0 +1,43 @@ +| +a +i +r +k +e +' +u +j +h +c +n +t +l +o +q +w +b +x +m +s +p +y +z +d +g +f +– +v +- +ä +1 +0 +2 +6 +4 +7 +ñ +5 +3 +8 +— + diff --git a/full_models/quc-dialect_north/D_100000.pth b/full_models/quc-dialect_north/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bbab655e705652ce4e1c049640c1e1ba54fcdd10 --- /dev/null +++ b/full_models/quc-dialect_north/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b42ae1faabc11d21690f18f02213a4df7ee6bf11fc1c5c43bcc8124e992a2c3 +size 561077845 diff --git a/full_models/quc-dialect_north/G_100000.pth b/full_models/quc-dialect_north/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..59cc84acf6a35b4995aa3534deb3ee28a8db7008 --- /dev/null +++ b/full_models/quc-dialect_north/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b54843ba7abf4a4b3cd2540a7cf6fd01a76a31d181ab7d8dece11daa72116456 +size 436363466 diff --git a/full_models/quc-dialect_north/config.json b/full_models/quc-dialect_north/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quc-dialect_north/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quc-dialect_north/vocab.txt b/full_models/quc-dialect_north/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aa3a33a3dd9bf8963b7d490d6e838ced37d0a8a2 --- /dev/null +++ b/full_models/quc-dialect_north/vocab.txt @@ -0,0 +1,35 @@ +| +a +' +i +k +j +e +c +h +l +u +n +r +q +o +t +x +m +b +w +s +p +y +z +d +ú +é +g +ó +í +f +v +á +ñ + diff --git a/full_models/quf/D_100000.pth b/full_models/quf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f3750e1b6ba43fe9f46b68830db8fca44de29df --- /dev/null +++ b/full_models/quf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20ce5692ef0697663d22c1368a9fb77777001cc55ccab23f05dc9027cbf1697 +size 561078450 diff --git a/full_models/quf/G_100000.pth b/full_models/quf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e32464bdbcead9a770bc364302c60fe4d9e67d7c --- /dev/null +++ b/full_models/quf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdb455fcc19c8cf6b826b645331ff22156588565db0c5931d2cc11ad2c991789 +size 436371389 diff --git a/full_models/quf/config.json b/full_models/quf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quf/vocab.txt b/full_models/quf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9460af971389f2367eadeee1205fd35f0136e730 --- /dev/null +++ b/full_models/quf/vocab.txt @@ -0,0 +1,35 @@ +a +| +n +i +u +k +y +l +h +p +m +r +q +s +t +c +w +d +' +e +j +b +g +- +o +ñ +f +v +z +0 +x +1 +2 +4 + diff --git a/full_models/quh/D_100000.pth b/full_models/quh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..96699495e7a12a44c7553ced8dc6eabe26300140 --- /dev/null +++ b/full_models/quh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe37c83c907179966bb1f40c1c37c088d33060b9526505160b30b1426ee1012 +size 561078255 diff --git a/full_models/quh/G_100000.pth b/full_models/quh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82454d8a59c87e16eace1468cfac6c03da62853a --- /dev/null +++ b/full_models/quh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2b79fad4241d7033f25591d75021295d229274483f5a58188d68e7f17a7f89 +size 436386104 diff --git a/full_models/quh/config.json b/full_models/quh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quh/vocab.txt b/full_models/quh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c761076488811d7cd812ec312467a4ba979cc3a1 --- /dev/null +++ b/full_models/quh/vocab.txt @@ -0,0 +1,43 @@ +z +á +a +ñ +l +h +t +p +o +g +2 + +d +5 +w +ú +k +é +1 +6 +4 +y +0 +f +n +c +v +' +e +í +i +x +b +_ +j +3 +q +ó +r +u +s +m +7 diff --git a/full_models/qul/D_100000.pth b/full_models/qul/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..855cf31a8af9d0f3897de48e4ff3d80dfecc3516 --- /dev/null +++ b/full_models/qul/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c47c2fa7c6e138e4dc690cb9b6683afafc61704879d8978acb628cf10737f1 +size 561078640 diff --git a/full_models/qul/G_100000.pth b/full_models/qul/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f08759bc2817586890bf8ed79b7e8f08b78eedc --- /dev/null +++ b/full_models/qul/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55eae1f233f3f61fa029bbfc8091227e6a9607730e784552e6026939a8a3b6a6 +size 436378177 diff --git a/full_models/qul/config.json b/full_models/qul/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qul/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qul/vocab.txt b/full_models/qul/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ec40aa38649c907d4b2d6ba481472575090f470c --- /dev/null +++ b/full_models/qul/vocab.txt @@ -0,0 +1,38 @@ +a +| +n +i +u +q +k +h +c +m +y +s +p +t +r +l +w +j +' +o +e +d +ñ +– +b +g +f +í +é +v +ó +ä +z +ú +á +ï +x + diff --git a/full_models/quw/D_100000.pth b/full_models/quw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1c52d1c8bed46df0c30c2bcd2d5d7a135afeb600 --- /dev/null +++ b/full_models/quw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd273e1b294d1dac4fc18e0b5d2ed32913e00568b13a7fb8b064342df8a41190 +size 561078727 diff --git a/full_models/quw/G_100000.pth b/full_models/quw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2031a375141923419bccb185540bb3b39c1fd5fc --- /dev/null +++ b/full_models/quw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8b644088906fd6dd5c16a0fcb5698668ee5ab108d030fd325b1ea1a6e3bc48 +size 436395066 diff --git a/full_models/quw/config.json b/full_models/quw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quw/vocab.txt b/full_models/quw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bb376ccd885b545481957d15718611675da2c350 --- /dev/null +++ b/full_models/quw/vocab.txt @@ -0,0 +1,44 @@ +a +| +i +u +n +c +h +s +r +m +p +l +t +g +j +d +y +ñ +o +e +q +b +z +v +ú +f +í +ź +é +ü +á +ó +0 +1 +2 +x +ï +— +' +k +- +ä +ḿ + diff --git a/full_models/quy/D_100000.pth b/full_models/quy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..347993e80e872dcd09e9cfe01911b8cdec86e942 --- /dev/null +++ b/full_models/quy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94896dbd432aa537325a0de941d175b406976d2699fd2170c1c681b3dbbddc8e +size 561078216 diff --git a/full_models/quy/G_100000.pth b/full_models/quy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..93c3b036c2dbe2e7df8ed85a8647878866aeca97 --- /dev/null +++ b/full_models/quy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3da1fea8b96bd32cf47c351b42f3cecdcb64ed85622ed24c76b064605b6a512 +size 436371031 diff --git a/full_models/quy/config.json b/full_models/quy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quy/vocab.txt b/full_models/quy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aa07815af12eb9d107e6a50fcd33850372a5aa66 --- /dev/null +++ b/full_models/quy/vocab.txt @@ -0,0 +1,36 @@ +a +_ +o +g +s +f +w +z +c +i +u +j +d +r +ó +ñ +q +m +á +e +v +k +p +n +l +b +x +- +í + +é +t +y +h +— +ú diff --git a/full_models/quz/D_100000.pth b/full_models/quz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..624e851c0cbb98fd57588ba2fc2334b200dec50b --- /dev/null +++ b/full_models/quz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fd86a89725af83c7faf37d3824db296563871f8d357e07578f6183a992ffb0 +size 561078748 diff --git a/full_models/quz/G_100000.pth b/full_models/quz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..809d1147f20b681b874de7340450b3fce47a991d --- /dev/null +++ b/full_models/quz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1723774e696a2f11c58ce5e89a2ee2b47aad65955b0abae3d8865af28adf9364 +size 436378676 diff --git a/full_models/quz/config.json b/full_models/quz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/quz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/quz/vocab.txt b/full_models/quz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4c92935cde7905d4c5f08c968d5897a8f31e7801 --- /dev/null +++ b/full_models/quz/vocab.txt @@ -0,0 +1,37 @@ +a +| +n +i +u +q +k +s +h +p +y +c +t +m +r +l +o +w +e +ñ +' +d +j +g +b +- +– +v +f +í +z +é +á +ó +ú +x + diff --git a/full_models/qvc/D_100000.pth b/full_models/qvc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..435909ae9494a15fd6b77441a828f3d3b1e2845d --- /dev/null +++ b/full_models/qvc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34bbb564e3542a751a7b3570779c0652a5432fd6c771ef863623ab958e90f19 +size 561078613 diff --git a/full_models/qvc/G_100000.pth b/full_models/qvc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..19209e1645ed56e1608d8eb69f91847531255259 --- /dev/null +++ b/full_models/qvc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d8bab5c38a946abb08d180ec32af99958aaaa3fe8fdcfa600f94a1a6ba5a33f +size 436387398 diff --git a/full_models/qvc/config.json b/full_models/qvc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvc/vocab.txt b/full_models/qvc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..eb8a5365ff1e8f63b336197dbe2a294f0cd0d7a0 --- /dev/null +++ b/full_models/qvc/vocab.txt @@ -0,0 +1,42 @@ +a +| +i +n +u +h +y +s +q +k +p +m +l +r +c +t +d +w +b +g +j +o +ñ +— +f +e +0 +á +4 +2 +˻ +˼ +í +1 +5 +' +3 +8 +9 +7 +6 + diff --git a/full_models/qve/D_100000.pth b/full_models/qve/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eef351f601f846b67895cf7e8b7fddcb9102e06f --- /dev/null +++ b/full_models/qve/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90484d2dda789cbe50f764cca1280353289a9e4f6b730c09c06831bd083522a9 +size 561077938 diff --git a/full_models/qve/G_100000.pth b/full_models/qve/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c8fe3338c725460cc1b0abbff873a6f13067c198 --- /dev/null +++ b/full_models/qve/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ecf5fa137ee6bafd2ab0a6dbe399e5e22a9f47c56dcd1629f36c185d9b0c75e +size 436382777 diff --git a/full_models/qve/config.json b/full_models/qve/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qve/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qve/vocab.txt b/full_models/qve/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71deada434a78e4c4a6ac4fee74bf436c3c8e658 --- /dev/null +++ b/full_models/qve/vocab.txt @@ -0,0 +1,40 @@ +a +| +n +i +u +s +k +q +h +p +c +t +y +r +m +l +o +e +w +d +ñ +j +b +' +g +v +f +á +— +z +í +ó +é +- +ú +x +0 +1 +2 + diff --git a/full_models/qvh/D_100000.pth b/full_models/qvh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5daa0fc83984904a278c640035b82f627566246b --- /dev/null +++ b/full_models/qvh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff16582cc2d9edd280c076033ccab7fb2334846684bc103c4e2ec71da7aab7fe +size 561078640 diff --git a/full_models/qvh/G_100000.pth b/full_models/qvh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4658294bafa42d9fb3d726946d67feb5422c861 --- /dev/null +++ b/full_models/qvh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:091b6d55e43149ec1835e5f24972f3921771a48513d7d20c8f36b4316447f236 +size 436386321 diff --git a/full_models/qvh/config.json b/full_models/qvh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvh/vocab.txt b/full_models/qvh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..788f578bc0450d7b8fd9e19248ee632540f27f74 --- /dev/null +++ b/full_models/qvh/vocab.txt @@ -0,0 +1,41 @@ +ë +f +h +ü +z +o +x +ñ +ä +y +r +d +i +t +ö +k +l +_ +q +u +ï +n +c +v + +é +ó +b +g +j +í +- +ú +m +p +e +á +s +a +' +w diff --git a/full_models/qvm/D_100000.pth b/full_models/qvm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fb648b8507b8bdd425e7e02046feab8e639a5331 --- /dev/null +++ b/full_models/qvm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c94a71f8721310ef4f9a3d30a7eda327227713205bac0cb4406ecd8970392ccc +size 561078597 diff --git a/full_models/qvm/G_100000.pth b/full_models/qvm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e18b5bab88e774e7a0a7a64221c591062552d405 --- /dev/null +++ b/full_models/qvm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b05f9be55b0c724f8cdb4876a10bec95dcca554e4140184902d99b91be86c2 +size 436385104 diff --git a/full_models/qvm/config.json b/full_models/qvm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvm/vocab.txt b/full_models/qvm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b9e4b6519521ac16922d28b603c2066cd88fda09 --- /dev/null +++ b/full_models/qvm/vocab.txt @@ -0,0 +1,41 @@ +a +| +n +i +c +u +s +t +g +y +p +r +m +h +o +l +e +ä +w +q +j +d +b +ö +ë +f +v +- +ï +ú +z +á +ü +é +ñ +í +ó +x +' +k + diff --git a/full_models/qvn/D_100000.pth b/full_models/qvn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0d452db66029a4ef87bcf6721c19874451c16fdc --- /dev/null +++ b/full_models/qvn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc0b81f0dfa592346295107ae702afed24121efd241a8d55634c742cd202c82 +size 561078610 diff --git a/full_models/qvn/G_100000.pth b/full_models/qvn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8ff6b5e50763aa7ca6df09c6ce710a1bf22699d5 --- /dev/null +++ b/full_models/qvn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c8466d7e26c5b6ec484ab4731bb9687dd176dafc0ad016fd4d3e1712a7a063 +size 436387486 diff --git a/full_models/qvn/config.json b/full_models/qvn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvn/vocab.txt b/full_models/qvn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7b42f9fc8d70bc41a9630af3d14a1d3f02889cd4 --- /dev/null +++ b/full_models/qvn/vocab.txt @@ -0,0 +1,42 @@ +a +| +n +c +u +i +r +y +m +g +h +s +p +t +ä +l +o +w +j +e +d +q +b +ü +ï +- +v +z +ë +f +ñ +ö +é +ú +í +' +á +ó +x +— +k + diff --git a/full_models/qvo/D_100000.pth b/full_models/qvo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c08e7f69e2d1f44a51c85e03dc20da22d37ff42b --- /dev/null +++ b/full_models/qvo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7421d4a4d127aeb317e0759e593f3856fd1794fea1de48b6d44f1753c18db2d8 +size 561078722 diff --git a/full_models/qvo/G_100000.pth b/full_models/qvo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..181cabc7969141d66f15403e3935ffe653083077 --- /dev/null +++ b/full_models/qvo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6cde753017fb66265a5d6570fb6cd83eeab377d17a7d1e75e2636cb276376a +size 436375981 diff --git a/full_models/qvo/config.json b/full_models/qvo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvo/vocab.txt b/full_models/qvo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..01aec67a54d1a5ffee6fcf279bd3ab3d5fb6873d --- /dev/null +++ b/full_models/qvo/vocab.txt @@ -0,0 +1,36 @@ +a +c +| +i +u +n +h +s +p +t +r +m +l +y +q +o +ñ +j +e +d +— +b +- +g +f +v +z +' +ó +x +í +á +k +ú +é + diff --git a/full_models/qvs/D_100000.pth b/full_models/qvs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fc12e8a5bde43da6c21988bac237e154491168b8 --- /dev/null +++ b/full_models/qvs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64df966a1b6e99442c1ff1df33a05402d7bc8ba2c6e2bb2003504fe0c3fe68e4 +size 561078125 diff --git a/full_models/qvs/G_100000.pth b/full_models/qvs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ad8fb0877c8de5510a7d2302541630a65f7a36d --- /dev/null +++ b/full_models/qvs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd3fa0a0142c43cb3b10a39955c4bc9d449bb2dfd2b291ac9713c8cc3d16284 +size 436362179 diff --git a/full_models/qvs/config.json b/full_models/qvs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvs/vocab.txt b/full_models/qvs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3455d89a6679be3ae4f175e22f534be0f7e686ae --- /dev/null +++ b/full_models/qvs/vocab.txt @@ -0,0 +1,31 @@ +a +| +n +k +i +u +h +s +t +p +y +c +r +l +m +w +e +d +o +j +ñ +b +g +v +— +f +í +á +x +z + diff --git a/full_models/qvw/D_100000.pth b/full_models/qvw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8dcd68b922d93be7ab976320204053794d850b1b --- /dev/null +++ b/full_models/qvw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08de375931267cb8cd57cdd574a4d171de475315b3ee9795710e3b854c7b8734 +size 561078754 diff --git a/full_models/qvw/G_100000.pth b/full_models/qvw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0e38fe4b0d3b63c5454f3729626ab11942d7c96d --- /dev/null +++ b/full_models/qvw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f46a0d552405d6db5439f84872a564113c5719a7d7bb8c63f4a70ed6e66a42f +size 436399506 diff --git a/full_models/qvw/config.json b/full_models/qvw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvw/vocab.txt b/full_models/qvw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4722a0ac5bcb7e62eb97d13c18a76609ce60d906 --- /dev/null +++ b/full_models/qvw/vocab.txt @@ -0,0 +1,46 @@ +a +| +c +n +i +u +l +y +h +m +p +t +s +ä +w +ć +q +ś +r +ü +j +ñ +d +ï +' +o +á +e +- +b +g +f +ú +í +v +z +ë +é +˻ +˼ +x +k +ó +— +ö + diff --git a/full_models/qvz/D_100000.pth b/full_models/qvz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c38fe2c62b152a87a15adea66798cbf07b33df9a --- /dev/null +++ b/full_models/qvz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6619f1a2073f116ab09a64ca8c11e6433a381d60b1b7f0b8a12af3840ce4d40 +size 561078727 diff --git a/full_models/qvz/G_100000.pth b/full_models/qvz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ffe5c4874b1ee9b2e5046801a96afa11933a85b2 --- /dev/null +++ b/full_models/qvz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3391f2da3dedb9f92fb4c129cab0072820d4dda42cbe1b7d75d6a8e3bffec12 +size 436371399 diff --git a/full_models/qvz/config.json b/full_models/qvz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qvz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qvz/vocab.txt b/full_models/qvz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0a8b70e9731597976a86d41f973316f8c8c4a4b3 --- /dev/null +++ b/full_models/qvz/vocab.txt @@ -0,0 +1,35 @@ +a +| +i +u +c +n +h +s +t +r +m +g +l +p +y +d +o +ñ +b +e +q +j +z +á +v +f +- +ü +í +ó +ú +é +x +k + diff --git a/full_models/qwh/D_100000.pth b/full_models/qwh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff7d6d5ebceae5784e2c84c9d72b5fb9d150c8a3 --- /dev/null +++ b/full_models/qwh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287e3e2ced7280a09d1f8aa05bd259d41df7cf6cda142cb35279e148057d1870 +size 561078857 diff --git a/full_models/qwh/G_100000.pth b/full_models/qwh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a4889ed80e36c775a7b8f1eee4f0560be24f09a1 --- /dev/null +++ b/full_models/qwh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536100218903769ba6c7fbd3261e055543226b4f1cb3b0480fd6a136730d1556 +size 436379068 diff --git a/full_models/qwh/config.json b/full_models/qwh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qwh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qwh/vocab.txt b/full_models/qwh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d90900fdfee34528b5253e5917ed5f0502480549 --- /dev/null +++ b/full_models/qwh/vocab.txt @@ -0,0 +1,37 @@ +a +| +n +i +u +c +q +s +t +r +e +m +p +l +o +y +h +w +ä +d +j +b +ë +g +ï +— +f +ñ +ö +ü +z +v +˻ +˼ +x +' + diff --git a/full_models/qxh/D_100000.pth b/full_models/qxh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..784440e080f4e0b32189b564a41fba3e64ae9093 --- /dev/null +++ b/full_models/qxh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c86ed8580d994f469aa3358887a0507120956bbfe30317ee22813fba0bdc5b9 +size 561078587 diff --git a/full_models/qxh/G_100000.pth b/full_models/qxh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bde08834e0417160aca5f7286876649b21da9009 --- /dev/null +++ b/full_models/qxh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b606293dd60371882654e359733634b058030dfa7b118b5883790b64d6104db +size 436387512 diff --git a/full_models/qxh/config.json b/full_models/qxh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qxh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qxh/vocab.txt b/full_models/qxh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f16161ac7c8853324920072269a86956dff021f4 --- /dev/null +++ b/full_models/qxh/vocab.txt @@ -0,0 +1,42 @@ +a +| +n +i +u +c +h +s +r +p +t +m +y +l +j +w +q +ä +g +ć +d +o +e +- +ñ +ú +ç +ü +ï +b +é +í +f +ó +á +z +v +x +k +2 +­ + diff --git a/full_models/qxl/D_100000.pth b/full_models/qxl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a207ce2e66483e72e822badf14a8f4157582ff9d --- /dev/null +++ b/full_models/qxl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942ef5e7f07b8fdfea382e4eee27ed9eddaf8f9b39462c98933d752816a77f42 +size 561078710 diff --git a/full_models/qxl/G_100000.pth b/full_models/qxl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8332c8b2aed8322e05d464c677e8655f498cd3f0 --- /dev/null +++ b/full_models/qxl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068c04f44f3a564a738aa19200173effb12f6dcdae0603cca7fa31ee597dc617 +size 436379941 diff --git a/full_models/qxl/config.json b/full_models/qxl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qxl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qxl/vocab.txt b/full_models/qxl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..225f05e9b886320f12026cdb6fc75f93747834e1 --- /dev/null +++ b/full_models/qxl/vocab.txt @@ -0,0 +1,38 @@ +í +– +- +n +w +k +ú +z +' +q +r +d +c +ó +p +é +m +e +_ +h +t +x +o +f +u +s +i +ñ + +v +ü +y +l +b +á +a +j +g diff --git a/full_models/qxn/D_100000.pth b/full_models/qxn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3de675f3c9013ebee79acfe01b9db729a45d24bb --- /dev/null +++ b/full_models/qxn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970ecc4c538f224b4309bbe7f77f733b91699716eb7e6299075528f2ec9798da +size 561078604 diff --git a/full_models/qxn/G_100000.pth b/full_models/qxn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d9edf43bcfcdfbd255b5130bf0b106c7974340e6 --- /dev/null +++ b/full_models/qxn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e2debf5ed8e4513aa05e1bd33205413c44bfd94673699e82c06e4e5b71f9a1 +size 436385208 diff --git a/full_models/qxn/config.json b/full_models/qxn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qxn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qxn/vocab.txt b/full_models/qxn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..09d9f614c2b8b3f32eb584745da8b28e58b7c797 --- /dev/null +++ b/full_models/qxn/vocab.txt @@ -0,0 +1,41 @@ +a +| +n +i +u +c +s +y +t +r +g +m +p +l +o +e +h +ä +w +q +ö +d +j +ñ +b +ï +f +v +ë +ü +z +é +í +ó +á +ú +x +k +' +- + diff --git a/full_models/qxo/D_100000.pth b/full_models/qxo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..561d9c0b3f8e6b3b452c2c2a8f3fc6e28019e168 --- /dev/null +++ b/full_models/qxo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f27193bcbb2145a3840eb8873aff12ec4ddb43f1112caa80f4f85ad4455fdd03 +size 561078619 diff --git a/full_models/qxo/G_100000.pth b/full_models/qxo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7436c0abd9b38cf21bc599902d8a32fa1b02fdbf --- /dev/null +++ b/full_models/qxo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f545ca780b5fba79960e115c5865bae324b268bcae3c11e1b97bec601017ad9 +size 436380580 diff --git a/full_models/qxo/config.json b/full_models/qxo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qxo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qxo/vocab.txt b/full_models/qxo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..36bfa5a4967867dd8782b60a00dc6dc57828c7aa --- /dev/null +++ b/full_models/qxo/vocab.txt @@ -0,0 +1,39 @@ +a +| +n +i +u +c +t +y +s +r +m +g +p +l +ä +h +o +e +ö +w +q +d +j +ñ +b +ï +v +ë +f +ü +z +- +0 +' +x +1 +2 +k + diff --git a/full_models/qxr/D_100000.pth b/full_models/qxr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3e14038b16a12f85f39ba34bd1903cb958489929 --- /dev/null +++ b/full_models/qxr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c5f49f33456397392b73c05f719e2576401c643645f85637ca49fdc3e200b4 +size 561078380 diff --git a/full_models/qxr/G_100000.pth b/full_models/qxr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5a5e68786ba54e41c117e41f8186cf10d6ba353e --- /dev/null +++ b/full_models/qxr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78f7d9407b9fcb66e2c61e191743768c695c913cb62bb48131d3d275e3d8e1b +size 436371087 diff --git a/full_models/qxr/config.json b/full_models/qxr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/qxr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/qxr/vocab.txt b/full_models/qxr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..77c09ef5c8f43ee2476e28e8340918e5b9bac82c --- /dev/null +++ b/full_models/qxr/vocab.txt @@ -0,0 +1,36 @@ +o +ü +v +f +ó +k + +n +g +ú +x +p +— +m +d +q +- +z +ñ +_ +é +á +i +u +t +a +b +j +y +h +e +s +l +c +í +r diff --git a/full_models/rah/D_100000.pth b/full_models/rah/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ac6ef96ff294b178416e33c5836c11752681c33 --- /dev/null +++ b/full_models/rah/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92377d17e02607b4a8e11ce99fbbe9ee5ed8ae432375e7a17a6a7c81a7d375d6 +size 561075935 diff --git a/full_models/rah/G_100000.pth b/full_models/rah/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..44ae119b650a3599b7da7fb8b971350b87bf06a7 --- /dev/null +++ b/full_models/rah/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea0c61a35f6f9ff804957944353d1ca854c92f6741fd910c84e48d373b7e639 +size 436363308 diff --git a/full_models/rah/config.json b/full_models/rah/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rah/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rah/vocab.txt b/full_models/rah/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5c0a9108f62c99960d83dd1a36c79277f6a79c26 --- /dev/null +++ b/full_models/rah/vocab.txt @@ -0,0 +1,40 @@ +ক +চ +ে +া +ব +ই +য +এ +ঃ +ৰ +হ +ৱ +ৗ +প +দ +থ +জ +ম +খ +গ +_ +ল +ং +্ +ছ +ভ +ু +ি +ো +অ +ন +আ +' +ও +ত +ঙ +ফ + +উ +় diff --git a/full_models/rai/D_100000.pth b/full_models/rai/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0cbdb7f52828f0444869c41c380defd07d817fd0 --- /dev/null +++ b/full_models/rai/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fd9e3aa183fb1eb52c1bd3e1f6b63e417e21efe603b22909340d54b65fa89d +size 561078741 diff --git a/full_models/rai/G_100000.pth b/full_models/rai/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5da42400acceb31703e13e91b31e8fccc1dbd0a6 --- /dev/null +++ b/full_models/rai/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499a411ef8702f4901ed79a3652fe39298467809e7fe6946aded3aa82f78f0d2 +size 436366658 diff --git a/full_models/rai/config.json b/full_models/rai/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rai/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rai/vocab.txt b/full_models/rai/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c8fb3571881d49c8e39351600e92ee9e38ed3158 --- /dev/null +++ b/full_models/rai/vocab.txt @@ -0,0 +1,32 @@ +a +| +i +n +u +t +m +r +k +p +o +d +g +b +l +w +e +s +1 +2 +0 +7 +4 +6 +5 +3 +' +8 +9 +- +f + diff --git a/full_models/rap/D_100000.pth b/full_models/rap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..250030c2f691e764965a266bf02b1f8a6051dc35 --- /dev/null +++ b/full_models/rap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816101cc177460b7488625d73a1463e4ac8dcd04c06675bfb25e240e07a2240d +size 561077947 diff --git a/full_models/rap/G_100000.pth b/full_models/rap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ef0e4d9eb379e5ab07cfb8e271bccbfa1a5cb853 --- /dev/null +++ b/full_models/rap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bec381e9ec66f52ce27fb70500bddfb75acb4380567155f393fca11674415ced +size 436370211 diff --git a/full_models/rap/config.json b/full_models/rap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rap/vocab.txt b/full_models/rap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5f170e51e1f6e44620796a934b0519b0bd4fb5e0 --- /dev/null +++ b/full_models/rap/vocab.txt @@ -0,0 +1,37 @@ +l +á +ŋ +d +b +ī +n +j +g +h +ū +— +o +k +ó +s +e +f +ā +- +m +_ +u +p + +a +ē +ō +' +í +v +z +r +c +ꞌ +t +i diff --git a/full_models/rav/D_100000.pth b/full_models/rav/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81bbbdc6aaece45fa282001365e97b7915c42432 --- /dev/null +++ b/full_models/rav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1f060946cc03ec6f5b3ad85ba438fe090294f34f09ea5d07fb80ca66893ec9 +size 561079119 diff --git a/full_models/rav/G_100000.pth b/full_models/rav/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d9fd1cad18856a615b7950fffb820a4b2e653cfc --- /dev/null +++ b/full_models/rav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985d16ef26a0ebed80d1854f8edf4dc24689b2b2676fe58699923a0739387bc3 +size 436424730 diff --git a/full_models/rav/config.json b/full_models/rav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rav/vocab.txt b/full_models/rav/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..22593b3fcfb367b26467fb73d29189d10aaf6981 --- /dev/null +++ b/full_models/rav/vocab.txt @@ -0,0 +1,56 @@ +ा +| +ी +म +् +क +न +ू +‍ +ल +त +स +ख +प +ँ +ो +च +व +र +ई +य +ब +ङ +े +आ +छ +ह +ध +द +ऊ +ग +ए +झ +अ +भ +थ +ज +ट +फ +ढ +ड +ः +ठ +़ +घ +ओ +ं +' +- +ृ +उ +ऐ +इ +ण +श + diff --git a/full_models/raw/D_100000.pth b/full_models/raw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b422af9d8890cc0cff07b4a60091bec9b1c3ec58 --- /dev/null +++ b/full_models/raw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40326761a00cb4b6b4285ce5bbf89f0a10e5b6b2ad28c3c3a465cb8dbe4d63fe +size 561078873 diff --git a/full_models/raw/G_100000.pth b/full_models/raw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88d9ff469bcb1f4df1a2618a941f359ad55c4d93 --- /dev/null +++ b/full_models/raw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb485fe4ac162b0859924cd5e9af87ac93bbba15b24b611892fa57eac42775ff +size 436419480 diff --git a/full_models/raw/config.json b/full_models/raw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/raw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/raw/vocab.txt b/full_models/raw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..afd6f5b3f461aab19ae36f0b9d334e45dd7c46ce --- /dev/null +++ b/full_models/raw/vocab.txt @@ -0,0 +1,54 @@ +u +è +4 +ú +á +' +y +ā +ù +- +é +c +d +ò +f +à +w +í +z +q +2 +t +n +a +ó +v +j +m + +r +́ +ø +s +_ +i +l +ō +b +̀ +1 +h +ï +ū +̄ +g +ì +p +0 +ē +k +ǿ +6 +e +o diff --git a/full_models/rej/D_100000.pth b/full_models/rej/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2341de237fa6ac7da077836181c09d0ceabbf75 --- /dev/null +++ b/full_models/rej/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c27e3015750dd612cad378a82057d018dfeeed46d7084d04a367f77f697de9f2 +size 561078896 diff --git a/full_models/rej/G_100000.pth b/full_models/rej/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..abdb9d0067a7360e637f1476f74fb711c706cf5c --- /dev/null +++ b/full_models/rej/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a19ddcc959c4c9b7ae255c043a2a1e214fefe326d6a825ae7ee0c5c8cbc190 +size 436369628 diff --git a/full_models/rej/config.json b/full_models/rej/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rej/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rej/vocab.txt b/full_models/rej/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b22700400c5f28ea9f23c4bd0652f5eec8dbea19 --- /dev/null +++ b/full_models/rej/vocab.txt @@ -0,0 +1,33 @@ +e +d +b +v +_ +6 +z +m +1 +s +g +a +h +w +t +i +0 +p +y +' +- +4 +r + +o +j +u +n +2 +l +k +f +c diff --git a/full_models/rel/D_100000.pth b/full_models/rel/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..038a5ecb9a4d6ef311cfa142dad49e2976dcb120 --- /dev/null +++ b/full_models/rel/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f26b639bffe073b70344e9b356d2822268608bba19ce76a7f58cfffec37fdc5 +size 561078250 diff --git a/full_models/rel/G_100000.pth b/full_models/rel/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c345ded3c883ba0bf3d47d88ea35c992ba057dc0 --- /dev/null +++ b/full_models/rel/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ea87bba774b7d8cc73740bc338a26a4339ab7f7a7ca0414141717684c05437 +size 436354123 diff --git a/full_models/rel/config.json b/full_models/rel/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rel/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rel/vocab.txt b/full_models/rel/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8b77c719f7f7ae6c7dbf4c692b6b09ffd5397a7f --- /dev/null +++ b/full_models/rel/vocab.txt @@ -0,0 +1,29 @@ +o +e +l +h +f +b +m +' +é +s +ú +a +ó +r +u +i +n +k +t +d +á +g +c +j +w +y +í + +_ diff --git a/full_models/rgu/D_100000.pth b/full_models/rgu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e9567ee3de7cda7ad07390763a86c68c61e5fc5c --- /dev/null +++ b/full_models/rgu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebcc727b5b5467e2d03e2f7d823f9d507389c7c37853e52c9975837af5862110 +size 561075770 diff --git a/full_models/rgu/G_100000.pth b/full_models/rgu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fddf5b5be962e1341b48e8f31ef1474c3aa2ded1 --- /dev/null +++ b/full_models/rgu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:880ad400e924300037e896a91037aefaae617b10f04ab0cbb11e5533fdd2ab4f +size 436324665 diff --git a/full_models/rgu/config.json b/full_models/rgu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rgu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rgu/vocab.txt b/full_models/rgu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e21e8b188bad7b39fca0f7fe0c1bb7db6ef2312e --- /dev/null +++ b/full_models/rgu/vocab.txt @@ -0,0 +1,24 @@ +l +_ +d +a +n +y +c +t +b +h +k +s +r +f +e +g +p +m + +- +' +i +u +o diff --git a/full_models/rhg/D_100000.pth b/full_models/rhg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..880b1d1637d24d284b66273da0ed2f8288238677 --- /dev/null +++ b/full_models/rhg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebef13408caf2e1b2993da7fe5c60e894185b5b1bc077be4ae69455a42ddb002 +size 561076074 diff --git a/full_models/rhg/G_100000.pth b/full_models/rhg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c50b034827b39d0da71ac45c60e167d83f6e2591 --- /dev/null +++ b/full_models/rhg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b67a78240b98b0227bc83d3ad87da4d6e006d87a2b41798e283bd684da7dc6 +size 436352951 diff --git a/full_models/rhg/config.json b/full_models/rhg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rhg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rhg/vocab.txt b/full_models/rhg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..67784e17da0a9339dbf514514a6113a0fb7a39ef --- /dev/null +++ b/full_models/rhg/vocab.txt @@ -0,0 +1,35 @@ +t +n +s +j +e +l +u +í +f + +ñ +z +o +p +v +m +ú +_ +a +y +g +ç +i +r +c +w +h +é +b +á +- +' +d +ó +k diff --git a/full_models/rif-script_arabic/D_100000.pth b/full_models/rif-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d779c49254aad66326fbcca132b64fc07917506c --- /dev/null +++ b/full_models/rif-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa9546308c5f5930c45760b555862a3c3a9ddda827e2778cde4a522daf85e20 +size 561078973 diff --git a/full_models/rif-script_arabic/G_100000.pth b/full_models/rif-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..056ba1e03621356922d5cff83c23aa575f9ae6e4 --- /dev/null +++ b/full_models/rif-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25dfcbe6cc6b84dfdf11dace9f89a3ca3116c38d2287e3e35a208800e1ef3038 +size 436391186 diff --git a/full_models/rif-script_arabic/config.json b/full_models/rif-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rif-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rif-script_arabic/vocab.txt b/full_models/rif-script_arabic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4d6bdbd29ef4cd90a6d790f3dc5450c8f41617ab --- /dev/null +++ b/full_models/rif-script_arabic/vocab.txt @@ -0,0 +1,43 @@ +ڒ +ذ +ط +پ +ث +ت +و +ز +ݣ +_ +س +ظ +ض +ژ +آ +ٱ +ص +- +ى +أ +ا +ك + +ع +ي +ن +ج +ئ +د +خ +م +ب +ؤ +ء +إ +ه +ر +ف +غ +ق +ح +ل +ش diff --git a/full_models/rif-script_latin/D_100000.pth b/full_models/rif-script_latin/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..2162fae85b22d85135f1cbd958fa4bb7ff96b183 --- /dev/null +++ b/full_models/rif-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0f09088858ab6dfce928122060ebeed3d1abdc457d46a3c9cafaf6e4de0bbc +size 561078832 diff --git a/full_models/rif-script_latin/G_100000.pth b/full_models/rif-script_latin/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ba4b1d838b39cf140461975149a7d839a0d3702 --- /dev/null +++ b/full_models/rif-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb23a9df0830cfa296ae437c425bb28d77a39623ce46fb0a2f1e3babe4fbd8b +size 436387026 diff --git a/full_models/rif-script_latin/config.json b/full_models/rif-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rif-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rif-script_latin/vocab.txt b/full_models/rif-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..20e5069d4c536e7d1ac26c83bc464879cfe1f692 --- /dev/null +++ b/full_models/rif-script_latin/vocab.txt @@ -0,0 +1,41 @@ +| +a +n +i +e +m +r +s +ḏ +u +w +ṯ +y +b +t +ȓ +c +ɣ +l +d +ƹ +q +j +z +k +ḥ +- +f +x +g +ṣ +ṭ +h +ḍ +ǧ +ʼ +ẓ +p +č +' + diff --git a/full_models/ril/D_100000.pth b/full_models/ril/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bdc1ddf6c0981691c2bde33445ed069c2411887 --- /dev/null +++ b/full_models/ril/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c659fcf190381ca6ae064c1c58b69bcf1a6ee3e3afb57da566cd8e2fcba573fb +size 561076028 diff --git a/full_models/ril/G_100000.pth b/full_models/ril/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..75e5caf38e773b05c7e2ac3c5bd746342e3ee1b6 --- /dev/null +++ b/full_models/ril/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1a4ff64df4c67b9faef95edb9043fcd24420d2a131b02654837e0881e3e78f +size 436333656 diff --git a/full_models/ril/config.json b/full_models/ril/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ril/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ril/vocab.txt b/full_models/ril/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..35ecd7b5fb13fb8130311550fe18a09d4fc71220 --- /dev/null +++ b/full_models/ril/vocab.txt @@ -0,0 +1,27 @@ +| +a +z +h +e +n +u +k +i +t +m +w +r +p +o +g +l +s +d +y +c +b +9 +1 +0 +' + diff --git a/full_models/rim/D_100000.pth b/full_models/rim/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20f7af6d57f65c7759fd597b59d24db16c70c7b9 --- /dev/null +++ b/full_models/rim/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b218208e15bb2f4fa9f85dfb7baeda21122b3a752ed6e476f0de4c4bfa34e2 +size 561079017 diff --git a/full_models/rim/G_100000.pth b/full_models/rim/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..711d670d8d360d04734beb321c0e0ae87aed7219 --- /dev/null +++ b/full_models/rim/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7ea87571f226a019f4a608b6b831b33a9b3b8243007e86e9538b1311a1fb5d +size 436364807 diff --git a/full_models/rim/config.json b/full_models/rim/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rim/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rim/vocab.txt b/full_models/rim/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f5a54e3cb42d29563e01be8906a3bd79131dc113 --- /dev/null +++ b/full_models/rim/vocab.txt @@ -0,0 +1,30 @@ +| +a +u +n +e +ë +m +i +g +o +w +t +k +y +h +s +r +v +d +f +j +b +ü +l +' +c +p +z +- + diff --git a/full_models/rjs/D_100000.pth b/full_models/rjs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b62ad901162b14050a449ff14f3c86e86e828ce --- /dev/null +++ b/full_models/rjs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2482faecb8f5d8b8387146dd9499901d0a41ac8736136ab5620c660b58e1b0 +size 561078490 diff --git a/full_models/rjs/G_100000.pth b/full_models/rjs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c73f261d132b22a9ca7715cbb44ebc2b79a8b98e --- /dev/null +++ b/full_models/rjs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda3352afce5dfe6452f0ba065fcb89fcba9016f2576abf2d2db0bb3474b5eec +size 436431466 diff --git a/full_models/rjs/config.json b/full_models/rjs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rjs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rjs/vocab.txt b/full_models/rjs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bebd1e42e4e681cd55d3848001e0d7c7f29f53db --- /dev/null +++ b/full_models/rjs/vocab.txt @@ -0,0 +1,62 @@ +झ +ङ +े +स +म +ग +अ +ृ +_ +ट +फ +च +ल +ऩ +भ +घ +ऱ +३ +त +ि +‍ +4 +थ +1 +ख +ह +उ +' +ओ +य +ध +ए +ड +द +ज +q +ठ +इ +ो +़ +ँ +क +3 +i +m +प +र +ु +ढ +ं +ा +ब +श +छ +६ +आ +l +व +न +् + +2 diff --git a/full_models/rkt/D_100000.pth b/full_models/rkt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..753c614ab3947ed3e29eee39f66fc934d56e3807 --- /dev/null +++ b/full_models/rkt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d58a4efd070aa42c8d696603377a33c13f6067ffdc7232919032d7279c29996 +size 561078857 diff --git a/full_models/rkt/G_100000.pth b/full_models/rkt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2575e1822bcd5bf9215113101f9565aef97efab2 --- /dev/null +++ b/full_models/rkt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:422c9ee299134fc6c99cb7aa37faff1c229e97b8a90346deabc5e83e5cfb2418 +size 436438657 diff --git a/full_models/rkt/config.json b/full_models/rkt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rkt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rkt/vocab.txt b/full_models/rkt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4213897afa996dff4df1cfb7465334db3b34a274 --- /dev/null +++ b/full_models/rkt/vocab.txt @@ -0,0 +1,63 @@ +ধ +এ +ঝ +ৈ +ঢ +ঁ +ত +য +ঠ +অ +ফ +ঙ +ৎ +ং +ল +া +খ +ূ +ঈ +ন +় +ছ +ট +ৌ +শ +আ + +ঐ +ষ +জ +্ +ম +ব +ৃ +ও +ঋ +ঘ +র +ণ +ভ +— +ি +ঞ +_ +ই +ু +ী +চ +ড +উ +- +প +ঔ +' +ো +ে +দ +ঃ +থ +গ +ক +হ +স diff --git a/full_models/rmc-script_cyrillic/D_100000.pth b/full_models/rmc-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c9b2cd01147cfe81d59b762358582b5cb3bbbe22 --- /dev/null +++ b/full_models/rmc-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2855afb99c6a15d91c0e399e8d0bfc54b5256ed119de41ee4d581eb06555dd16 +size 561076024 diff --git a/full_models/rmc-script_cyrillic/G_100000.pth b/full_models/rmc-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fe4f37426467b1fece039d0355d5d73925faa061 --- /dev/null +++ b/full_models/rmc-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a58e57690262753d3129a919238eea3b98629ec3a82b1a8921af0607f80e1031 +size 436356144 diff --git a/full_models/rmc-script_cyrillic/config.json b/full_models/rmc-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rmc-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rmc-script_cyrillic/vocab.txt b/full_models/rmc-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aefe5715064fff290276443625d0cdc78b8f531f --- /dev/null +++ b/full_models/rmc-script_cyrillic/vocab.txt @@ -0,0 +1,37 @@ +| +а +е +н +о +р +с +л +д +і +к +в +т +п +є +м +у +г +я +й +ґ +б +ч +ш +и +ж +з +— +х +ц +ь +ї +ф +ю +щ +- + diff --git a/full_models/rmc-script_latin/D_100000.pth b/full_models/rmc-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4accf74a48720019b947af7a498b8360f941d38f --- /dev/null +++ b/full_models/rmc-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172e56a61d783c7d068e7f9512c4c9bc05a2b7b713956cb297471c851475c715 +size 561078717 diff --git a/full_models/rmc-script_latin/G_100000.pth b/full_models/rmc-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3123fd3cef1ed428905dc88ee98f77e22a96136 --- /dev/null +++ b/full_models/rmc-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7163c6b2ee92369682847814e0253c5193ed190e7f12e8b27af56d75ff675e07 +size 436387544 diff --git a/full_models/rmc-script_latin/config.json b/full_models/rmc-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rmc-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rmc-script_latin/vocab.txt b/full_models/rmc-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ccd5b3ff4fb77bbbafaaf4223ac5e92ac3aebc82 --- /dev/null +++ b/full_models/rmc-script_latin/vocab.txt @@ -0,0 +1,41 @@ +š +c +_ +b +ď +p +h +` +- +3 +ž +t + +' +ľ +z +j +5 +y +u +o +ó +x +1 +v +f +n +a +i +e +d +ť +s +m +k +ň +2 +r +č +l +g diff --git a/full_models/rmo/D_100000.pth b/full_models/rmo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..50c33b37df795942975948cb0972c75d76d8c7f0 --- /dev/null +++ b/full_models/rmo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9480e52e5811f5688d787214f129c4eb089dda3f56f377f72b111a7ae81f72aa +size 561078724 diff --git a/full_models/rmo/G_100000.pth b/full_models/rmo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6031ce5195466968669a6414b2f5feed26459968 --- /dev/null +++ b/full_models/rmo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6d7c694c4fd5099555b2ff2efe3e8050e4756197bf612bcabe3874aab3fbfc8 +size 436355280 diff --git a/full_models/rmo/config.json b/full_models/rmo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rmo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rmo/vocab.txt b/full_models/rmo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2d3731842151ea2a8cac438fe4725818860ac834 --- /dev/null +++ b/full_models/rmo/vocab.txt @@ -0,0 +1,28 @@ +| +e +a +n +o +l +r +s +i +k +t +h +d +u +p +m +w +j +b +c +g +f +- +v +z +x +y + diff --git a/full_models/rmy-script_cyrillic/D_100000.pth b/full_models/rmy-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..851e803083161883b079bb95955719099d1b95fd --- /dev/null +++ b/full_models/rmy-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc5899175bf981fff359d98c7a168a06340ab228e96e96c4b9180371c569266 +size 561075939 diff --git a/full_models/rmy-script_cyrillic/G_100000.pth b/full_models/rmy-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4aa8cca91131d70f9871da43e4b8de6b81a7deb --- /dev/null +++ b/full_models/rmy-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5daf355be4fce14ae76d14bafadfd15d22d6ea49b2abdb052d2843d1d550bb30 +size 436356009 diff --git a/full_models/rmy-script_cyrillic/config.json b/full_models/rmy-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rmy-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rmy-script_cyrillic/vocab.txt b/full_models/rmy-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e3c4015f3630c44cd8b3e206ae14985a13f5207b --- /dev/null +++ b/full_models/rmy-script_cyrillic/vocab.txt @@ -0,0 +1,37 @@ +ж +с +м +c +у +й +ч +п +- +р +ы +т +щ +я +ф +б +г +з +о +ш +а +— +и +ю +ц +в +ь +ё +д +л +е +н +к +_ +э +х + diff --git a/full_models/rmy-script_latin/D_100000.pth b/full_models/rmy-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bfa44fe811ff8a7c5e8ebcfe4d62968f575a2388 --- /dev/null +++ b/full_models/rmy-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef503c4b5b33890c5985c574fc53e327ec106fc93291d7b98ce9d12372f4210 +size 561078074 diff --git a/full_models/rmy-script_latin/G_100000.pth b/full_models/rmy-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..649d57f83263d3b59171797dd420bfeb89b2e289 --- /dev/null +++ b/full_models/rmy-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbcf63a44a50b245085dceb03514092a8a5e8390bc026fbfeedbfb0fd2c99e25 +size 436351563 diff --git a/full_models/rmy-script_latin/config.json b/full_models/rmy-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rmy-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rmy-script_latin/vocab.txt b/full_models/rmy-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7743b4452ca6b25368632481b7ec9cb5563a570f --- /dev/null +++ b/full_models/rmy-script_latin/vocab.txt @@ -0,0 +1,28 @@ +| +a +e +i +o +l +n +k +t +r +s +d +p +u +m +v +g +h +c +b +z +j +f +— +ñ +' +8 + diff --git a/full_models/rng/D_100000.pth b/full_models/rng/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0027f3540ceb616c79aa1e65a68a1ae16cd7f5f --- /dev/null +++ b/full_models/rng/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79d7112eb1edb2d42dc16dd1e417d30060cee76ae9f84c0f0b9e597c54334c1 +size 561078859 diff --git a/full_models/rng/G_100000.pth b/full_models/rng/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f6e6ea28a15a19aefc14c58dca98957ade2657f --- /dev/null +++ b/full_models/rng/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdae0a20142acbe751a69df9b225054da95201945dedc076da8674414839f4d1 +size 436395974 diff --git a/full_models/rng/config.json b/full_models/rng/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rng/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rng/vocab.txt b/full_models/rng/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..22d5c28b5386fd9e0d946a1f5006d081d2f9e630 --- /dev/null +++ b/full_models/rng/vocab.txt @@ -0,0 +1,44 @@ +| +a +i +n +u +k +e +l +b +m +h +w +o +t +y +s +g +ḍ +ŝ +š +f +' +ṛ +ṅ +p +d +ṭ +r +- +ḇ +z +v +c +ž +ṡ +ẹ +ṁ +ṣ +ï +— +ẑ +ḳ +ị + diff --git a/full_models/rnl/D_100000.pth b/full_models/rnl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87a5a11e7d5ff419959de100ebbc8fa9b7decd90 --- /dev/null +++ b/full_models/rnl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b71b4913dd785cb55b7c34ddd6968c5fa72c4a0852f3eab17332ed0c847b07 +size 561078862 diff --git a/full_models/rnl/G_100000.pth b/full_models/rnl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..097d525bc1afd8c00b87dfbee3139956686d85e9 --- /dev/null +++ b/full_models/rnl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db1e5f3d7615ab588483318253405d584c139c376ef312e5d818e646c062a4d2 +size 436375856 diff --git a/full_models/rnl/config.json b/full_models/rnl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rnl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rnl/vocab.txt b/full_models/rnl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c60c699e93b1cb9cdcaa94581214db4b6a6fa880 --- /dev/null +++ b/full_models/rnl/vocab.txt @@ -0,0 +1,36 @@ +0 +_ +u +e + +q +p +ē +d +k +v +ī +f +t +a +j +z +b +o +s +i +1 +2 +n +g +l +- +c +m +ō +h +3 +ā +' +r +ū diff --git a/full_models/rol/D_100000.pth b/full_models/rol/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb146751516261abeb400e020ce5fa6067c17bf0 --- /dev/null +++ b/full_models/rol/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6e0ba07c2d139729f9f68846e3fced013608776164be9f35f6f55c8d2cf7cd1 +size 561079343 diff --git a/full_models/rol/G_100000.pth b/full_models/rol/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..23055f2474634f307d19b5cfb105a2685db0a07d --- /dev/null +++ b/full_models/rol/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fc9ca4459d5a6602ad6b7a52eef405d63ae1c81da3ccb7f0c75a8b62f54c431 +size 436400185 diff --git a/full_models/rol/config.json b/full_models/rol/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rol/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rol/vocab.txt b/full_models/rol/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..28822f5177beb0432cf6d1776556eeb975035426 --- /dev/null +++ b/full_models/rol/vocab.txt @@ -0,0 +1,46 @@ +c +0 +w +4 +- +h +5 + +k +ñ +z +' +d +o +6 +9 +t +a +p +r +x +u +7 +2 +3 +8 +e +á +à +s +è +l +ì +f +q +1 +_ +j +y +v +ò +g +i +m +n +b diff --git a/full_models/ron/D_100000.pth b/full_models/ron/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a263c389c53269ca55870604b671a5d69def5b9 --- /dev/null +++ b/full_models/ron/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c2469004a0ef4de20edc15b91f618f64c2641a3043cfeb225acd04c9301605 +size 561110140 diff --git a/full_models/ron/G_100000.pth b/full_models/ron/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e66c3cd302a5c13afdc37c64022f111001df4a68 --- /dev/null +++ b/full_models/ron/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917840da2425062c0097eb85d79f2c676391cc2cc3acd098507c27c62bef6db1 +size 436608497 diff --git a/full_models/ron/config.json b/full_models/ron/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ron/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ron/vocab.txt b/full_models/ron/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..3a03c014541dc655bb23d27de1278e8c30cf3760 --- /dev/null +++ b/full_models/ron/vocab.txt @@ -0,0 +1,34 @@ +c +q +u +b +g +_ +n +– +m +z +i +t +l +ă +f +ș +a +1 +î +p +- +h +s +' +x +e +j +â + +r +v +o +ţ +d diff --git a/full_models/rop/D_100000.pth b/full_models/rop/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0095eb8b7cfa38872ef42eccec8b305da0bab37 --- /dev/null +++ b/full_models/rop/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02591f666842de5fc558d8c47a7b0fdfc5f7919b974ca5811a3af5c9512f74c +size 561075669 diff --git a/full_models/rop/G_100000.pth b/full_models/rop/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..85225d7b4cb5fdd8d7646c899dcd701bd3062efd --- /dev/null +++ b/full_models/rop/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6e2555a0ee8451234e8bd02c871458b302dd8ed5c45d4080ced3e3325b636e +size 436322349 diff --git a/full_models/rop/config.json b/full_models/rop/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rop/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rop/vocab.txt b/full_models/rop/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2cb2ee4e2f4d450135b7ee78991b3fd4d691ee61 --- /dev/null +++ b/full_models/rop/vocab.txt @@ -0,0 +1,23 @@ +b +f +n +r +u +j +h + +_ +d +k +i +y +m +e +a +t +w +o +l +s +g +p diff --git a/full_models/rro/D_100000.pth b/full_models/rro/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..09b6353bf93f05d5f0bc0e94324ee8515a45d2d2 --- /dev/null +++ b/full_models/rro/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a700abae5b123f09f02350f8e2b7f1ea43f7b1ac357872786e6a551d58c39844 +size 561079124 diff --git a/full_models/rro/G_100000.pth b/full_models/rro/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c43dfd8d85083027b8189aa74a49bd5ea1788c50 --- /dev/null +++ b/full_models/rro/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08e177e6aea30506e2bf924d45f4572e96dd28569bbd2a4f3fa3bfe9f966a6c +size 436371897 diff --git a/full_models/rro/config.json b/full_models/rro/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rro/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rro/vocab.txt b/full_models/rro/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..22f6e2807ab36aa0d9afc6da94767045b5033e0d --- /dev/null +++ b/full_models/rro/vocab.txt @@ -0,0 +1,33 @@ +u +l + +— +t +k +5 +1 +v +4 +h +d +ṯ +e +o +f +a +_ +i +n +g +y +0 +w +9 +3 +' +ṉ +b +s +p +m +r diff --git a/full_models/rub/D_100000.pth b/full_models/rub/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bd9dc6c59e861da5406e57c076eddf61e663e3a0 --- /dev/null +++ b/full_models/rub/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57a958968b6266a56fd7cfccd09c85b7385955b6440f2ef26ccbecbaa535ad3e +size 561078630 diff --git a/full_models/rub/G_100000.pth b/full_models/rub/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d894ae5e581d55db2132aa8d2f12ba34e167188 --- /dev/null +++ b/full_models/rub/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884f1c74816bafb1320bd7f79ab9a59fde617132d1be83f3348cf8fcd40c0f00 +size 436374846 diff --git a/full_models/rub/config.json b/full_models/rub/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rub/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rub/vocab.txt b/full_models/rub/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..26c28c66bd2e9783e834c231809c653e2ac9bf15 --- /dev/null +++ b/full_models/rub/vocab.txt @@ -0,0 +1,36 @@ +i +k +w +_ +u +z +b +o +t +a +ʼ +— +0 +s +e +c +- +̯ +p +4 +f +j +' +̱ + +l +r +g +y +h +d +v +n +ŋ +3 +m diff --git a/full_models/ruf/D_100000.pth b/full_models/ruf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c5666e2136366e2f4e21cef46c8cbfa2ef251bb --- /dev/null +++ b/full_models/ruf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809bdfb2d25f472789b4736e04aad8abef494550771b0c59cadf6e1d45d56c37 +size 561078890 diff --git a/full_models/ruf/G_100000.pth b/full_models/ruf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..305a75b3bdee4dc3f0fd7416f22f85ecf6561cbc --- /dev/null +++ b/full_models/ruf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78071d54dd686113aabdcdd4ab8a2aefaa7d4b40e8c31f111fc25f0418f0c16d +size 436372090 diff --git a/full_models/ruf/config.json b/full_models/ruf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ruf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ruf/vocab.txt b/full_models/ruf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..00d3e9d48131cd6a0afa72b824115fe434586af8 --- /dev/null +++ b/full_models/ruf/vocab.txt @@ -0,0 +1,34 @@ +m +z +d +3 +1 +e +g +u +0 +i +' +h +w +t +s +5 +o +v +f +_ +- +c +r +k +a +l +j +y +b +n +7 + +p +2 diff --git a/full_models/rug/D_100000.pth b/full_models/rug/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..455111739123bee4dc42b5c4958c52dbf0162101 --- /dev/null +++ b/full_models/rug/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fefb58c4b23b8e07886da3b327cef4a60635ea8398794ba42dbb876c939dc127 +size 561078879 diff --git a/full_models/rug/G_100000.pth b/full_models/rug/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88e04992801b8e85b4cc99873f7de9861b8470a3 --- /dev/null +++ b/full_models/rug/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ff8d6a6f2d0c87e348881d2d6b06aff6893a90f59e8e968f3ebe301277db40 +size 436351167 diff --git a/full_models/rug/config.json b/full_models/rug/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rug/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rug/vocab.txt b/full_models/rug/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..493763157516b1fbc6cf6b76a4a60a70e09fe5dc --- /dev/null +++ b/full_models/rug/vocab.txt @@ -0,0 +1,25 @@ +| +a +i +e +s +u +o +n +t +k +r +m +p +l +g +v +d +b +h +ṉ +z +q +' +- + diff --git a/full_models/run/D_100000.pth b/full_models/run/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1915d1026f88f55230b485a71639dbc2d79efac0 --- /dev/null +++ b/full_models/run/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a42fcc8863aaaf5f3a22bdf88381680baf4cffd2f18b1f968f20474efec31a +size 561078459 diff --git a/full_models/run/G_100000.pth b/full_models/run/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a5c261108b068487825c63f1a49a26bbb2bbe94d --- /dev/null +++ b/full_models/run/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e32218c87307fa1e1de85b60dfdf53032762287e21cb1801f5fa2d4740462f9d +size 436357434 diff --git a/full_models/run/config.json b/full_models/run/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/run/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/run/vocab.txt b/full_models/run/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0970310adeac6d9b457a4171ab9d43b79949d5cd --- /dev/null +++ b/full_models/run/vocab.txt @@ -0,0 +1,29 @@ +| +a +i +u +n +e +r +o +b +m +k +w +y +g +t +s +h +z +' +d +v +c +j +p +f +l +- +— + diff --git a/full_models/rus/D_100000.pth b/full_models/rus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66c3b132d2bbd5658f113c2a4dd99e4cec8e3b02 --- /dev/null +++ b/full_models/rus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a611ba9dd766e04fd657e44399a53146d9952c08aaa78cc229af5a59ef1d82 +size 561110354 diff --git a/full_models/rus/G_100000.pth b/full_models/rus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b763f8d961079805308bce9c17e4ad70a967b33b --- /dev/null +++ b/full_models/rus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a669a88f7fe7e3f9a73dc8d3f6854b83edd318f57f81417731e49044d0cf98 +size 436632962 diff --git a/full_models/rus/config.json b/full_models/rus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/rus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/rus/vocab.txt b/full_models/rus/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..8d0df6edfd962d06c43e3690cf72847fc4ae2e94 --- /dev/null +++ b/full_models/rus/vocab.txt @@ -0,0 +1,44 @@ +ч + +д +ь +я +й +с +у +а +о +2 +0 +ъ +ы +н +л +ж +х +ш +з +c +_ +п +m +ю +э +р +4 +щ +o +– +ф +q +и +ц +к +1 +е +б +- +т +в +г +м diff --git a/full_models/sab/D_100000.pth b/full_models/sab/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9bbfb4ac79fd842f3210876ce452811493ccddeb --- /dev/null +++ b/full_models/sab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5820e7b942f3abaa26e364759bf6a1fb51c5c44c50878bd80fb705526d62fd58 +size 561076181 diff --git a/full_models/sab/G_100000.pth b/full_models/sab/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d304ddcde8b7c5e9f8f01b81ce52eb683b9ad5d3 --- /dev/null +++ b/full_models/sab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b485a6f7f399b0f20ffe635d9afd3e4786646dadc35dada74e166deccbe04845 +size 436357973 diff --git a/full_models/sab/config.json b/full_models/sab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sab/vocab.txt b/full_models/sab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71a6e500350558a26c531d45674ffd7ac0de293f --- /dev/null +++ b/full_models/sab/vocab.txt @@ -0,0 +1,37 @@ +| +a +e +i +g +l +u +n +b +t +k +o +r +c +h +d +m +w +s +j +ñ +p +é +— +í +f +v +á +- +ó +z +q +y +ú +x +' + diff --git a/full_models/sag/D_100000.pth b/full_models/sag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7e831509523fe9aa221f58507e4ac32ac2cd4133 --- /dev/null +++ b/full_models/sag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd88f8e1b3765397a388b1de329df4c25b5739d536fdb93c04170c2c2171dca +size 561078846 diff --git a/full_models/sag/G_100000.pth b/full_models/sag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0650084451cea9d39c0c9e76dbb1ee2fe7d77ab8 --- /dev/null +++ b/full_models/sag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed5389e00f1b211aa6690f718bb2b75a11c85eb31f36105c302de60abd7e2810 +size 436383807 diff --git a/full_models/sag/config.json b/full_models/sag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sag/vocab.txt b/full_models/sag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6cb458fb00eae8c1236b12f9eee45222443a87e2 --- /dev/null +++ b/full_models/sag/vocab.txt @@ -0,0 +1,40 @@ +| +a +i +e +n +o +t +l +g +s +k +b +m +y +u +z +p +r +d +ë +w +f +h +â +- +j +é +ö +c +v +ê +ï +ô +– +' +q +x +è +î + diff --git a/full_models/sah/D_100000.pth b/full_models/sah/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..578bd2e83755920663c2b815780562a7f964c901 --- /dev/null +++ b/full_models/sah/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bb8871482c300ff3408c1b8cc11b76af093205f26efed0f9f9664c8db519df +size 561078981 diff --git a/full_models/sah/G_100000.pth b/full_models/sah/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d5dfd5ce1b417cbfdccc2208dae97f18a71918ae --- /dev/null +++ b/full_models/sah/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ff7c5c2ce04b24cc620f94092ae23d80e754e4687edf722b365c8add04d4e8 +size 436396083 diff --git a/full_models/sah/config.json b/full_models/sah/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sah/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sah/vocab.txt b/full_models/sah/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..000fa4d9a5baf069f36d35be58d2291d0ccd85d8 --- /dev/null +++ b/full_models/sah/vocab.txt @@ -0,0 +1,44 @@ +ю +у +й +h +р +в +ь +һ +т +– +з +с +ы +э +п +ф +н +б +я +ж +х +c +к +о +_ +a +а +ҥ +ү + +ц +ч +и +i +м +д +ҕ +е +г +3 +ө +л +- +ш diff --git a/full_models/saj/D_100000.pth b/full_models/saj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b7e5e3f75c834b96db20497f45b36ed6ed84fe7 --- /dev/null +++ b/full_models/saj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7edeb86b498ed9766ac16cd410514ecd4341fc5f0857cad405c1fae0904f2f7c +size 561077938 diff --git a/full_models/saj/G_100000.pth b/full_models/saj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f7c8bc135c08ed5293cd26d3b9d66ffcda1b6de --- /dev/null +++ b/full_models/saj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d113bcc7fc070120844311950751a40ca906e09b3b200e9368528e4c0224c778 +size 436350360 diff --git a/full_models/saj/config.json b/full_models/saj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/saj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/saj/vocab.txt b/full_models/saj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..39c76409a8257f1fcc43c3286c0dc4d1293b1228 --- /dev/null +++ b/full_models/saj/vocab.txt @@ -0,0 +1,30 @@ +ḇ +d +a +c +s +z +e +l +- +' +b +_ +k + +o +j +p +n +ḏ +h +m +i +f +r +y +̱ +g +u +t +w diff --git a/full_models/saq/D_100000.pth b/full_models/saq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a8b3b5f75d07a366e9ce8272926ca3466ba411b8 --- /dev/null +++ b/full_models/saq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19acfb0c86aed971142e09ebeb7f7c6e2ad78d7f9ac0a5205f26f89e61b1e8f2 +size 561078221 diff --git a/full_models/saq/G_100000.pth b/full_models/saq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..58f31d87e8ecfbf2288a2fb982f29d103e56202e --- /dev/null +++ b/full_models/saq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8fe829dee8180cac7c599ad0d95e7d29dd03be701f42522905289bd82f0300c +size 436372760 diff --git a/full_models/saq/config.json b/full_models/saq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/saq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/saq/vocab.txt b/full_models/saq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..696a3f4631cb69dac50f6999d82f150ed3b0f9f0 --- /dev/null +++ b/full_models/saq/vocab.txt @@ -0,0 +1,36 @@ +7 +u +o +k +8 +n +2 +- +h +a +m +5 +g +r +t +b +i +s +9 +l +6 +p +e +1 +c +y +' +d +_ + +0 +j +3 +꞉ +4 +w diff --git a/full_models/sas/D_100000.pth b/full_models/sas/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1472a1b20c7ca39fbe633a9782dea838da84122 --- /dev/null +++ b/full_models/sas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71565507a32b34783e14965429efb0c290470bf54816cebfdcb90d64e3201815 +size 561078598 diff --git a/full_models/sas/G_100000.pth b/full_models/sas/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bc29bdb9656df9ffbc674201445348632ffd8aa5 --- /dev/null +++ b/full_models/sas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7730f40778b97dc9259c4eb885aff2da35e8330e8396bc4c3f2a81f334be996a +size 436359850 diff --git a/full_models/sas/config.json b/full_models/sas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sas/vocab.txt b/full_models/sas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9a8a45e86dbc1f89bf974b2cc1af2bfe586d46ca --- /dev/null +++ b/full_models/sas/vocab.txt @@ -0,0 +1,30 @@ +| +a +e +n +i +s +d +t +g +q +l +u +m +k +p +r +ẽ +b +h +o +j +- +y +w +c +' +z +f +é + diff --git a/full_models/sba/D_100000.pth b/full_models/sba/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4c6668a60b1682c7730dbf8075ac35824477ae7 --- /dev/null +++ b/full_models/sba/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9afccf2d8541256c89263ce255d414712934085e7cd02f3558669470b680166 +size 561078725 diff --git a/full_models/sba/G_100000.pth b/full_models/sba/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a122bcbe531a96141a44eeae3d95c0c76f4035d0 --- /dev/null +++ b/full_models/sba/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d22603fe24200db32e0c7a0e63a0b7160386656fa0f6d6f211a9fa75923b2d +size 436407885 diff --git a/full_models/sba/config.json b/full_models/sba/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sba/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sba/vocab.txt b/full_models/sba/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6c417b0f6935b0ca653b058853cf26de9acec6e4 --- /dev/null +++ b/full_models/sba/vocab.txt @@ -0,0 +1,50 @@ +| +a +e +ə +g +n +d +l +m +r +o +i +j +k +t +ɔ +é +s +' +́ +b +u +w +ḛ +y +ŋ +ɓ +- +̰ +í +á +p +ḭ +è +ɛ +ó +à +ò +ɗ +h +ú +ṵ +̀ +ǝ +2 +1 +v +4 +3 + diff --git a/full_models/sbd/D_100000.pth b/full_models/sbd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..382a9ae5592b78c910e50ad01195852b13445b75 --- /dev/null +++ b/full_models/sbd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7836711c8a2587c1bcc296e2ffce5a88d501ceb49d89a50dd255d975fb06c700 +size 561078637 diff --git a/full_models/sbd/G_100000.pth b/full_models/sbd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c0b19b8cf0e4e925ca17d4192f840b1b1e2ab8c --- /dev/null +++ b/full_models/sbd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072dcf68419f50961d3933786c0730648c974abebcadf410503086cb1bb10262 +size 436408220 diff --git a/full_models/sbd/config.json b/full_models/sbd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sbd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sbd/vocab.txt b/full_models/sbd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71f6c2924f22c80bf86c3722ecac9921c1372ead --- /dev/null +++ b/full_models/sbd/vocab.txt @@ -0,0 +1,51 @@ +| +a +n +ɛ +i +l +ɔ +k +o +b +m +d +w +e +g +s +r +u +á +t +y +́ +ǹ +p +z +ã +ə +à +̃ +‐ +̀ +f +í +ĩ +ǎ +ì +ũ +h +ò +ǐ +ù +ú +— +ń +v +è +é +ó +̌ +- + diff --git a/full_models/sbl/D_100000.pth b/full_models/sbl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..63102c9025d471b08a34852215bccea6ebaf611c --- /dev/null +++ b/full_models/sbl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0a6402e428699c44bdc5f251d5f7560566813fd907dac1b345c702b908cddf +size 561078633 diff --git a/full_models/sbl/G_100000.pth b/full_models/sbl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9e7a7d298740740b3d64549b534c960bd5c32e0 --- /dev/null +++ b/full_models/sbl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a85388e5c2f32b60bf9aa764e390de6601d73d806727bd1372e19e9ef834343 +size 436357462 diff --git a/full_models/sbl/config.json b/full_models/sbl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sbl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sbl/vocab.txt b/full_models/sbl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5bbb58a74d322d57a061456f958fec4b47bccbbd --- /dev/null +++ b/full_models/sbl/vocab.txt @@ -0,0 +1,29 @@ +a +| +n +i +o +y +m +h +t +k +g +l +p +- +b +w +s +r +e +d +à +ò +è +̇ +̀ +' +ì +— + diff --git a/full_models/sbp/D_100000.pth b/full_models/sbp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f5cb0d9cd51a8f4d6f12cbe28449c66108561a7 --- /dev/null +++ b/full_models/sbp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85bf3a50c4f1fb8cdd16adada2fc786d9edc05646e35cfb7e836e70b17964877 +size 561078965 diff --git a/full_models/sbp/G_100000.pth b/full_models/sbp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..62559f993f85701f1ad87490727cbd88b1b8ed2f --- /dev/null +++ b/full_models/sbp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8ae6a5d3d3b74229991f1bedc2ae3c0957f4d02e2e858540caf4497fc191ce +size 436356830 diff --git a/full_models/sbp/config.json b/full_models/sbp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sbp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sbp/vocab.txt b/full_models/sbp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4f46419ec25925467826d18f6988590c12c5698 --- /dev/null +++ b/full_models/sbp/vocab.txt @@ -0,0 +1,27 @@ +_ +l +y +v + +j +' +g +h +ʼ +n +s +d +p +f +b +k +e +- +t +á +i +u +o +m +a +w diff --git a/full_models/sch/D_100000.pth b/full_models/sch/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..efa665193e8b9ff506a27237dbf9955f0158f770 --- /dev/null +++ b/full_models/sch/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8615cf083dc0c13559ecbb064f35aa8c9c1a30891a134ecbd984934798dd7b +size 561078960 diff --git a/full_models/sch/G_100000.pth b/full_models/sch/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0ee32a492ba105396d97d3d3a6986231abd19a04 --- /dev/null +++ b/full_models/sch/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bd0c2189c85e3eb1b373a490df30e30c0c22f9ff74a906483e95b7ce1d12e6 +size 436385937 diff --git a/full_models/sch/config.json b/full_models/sch/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sch/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sch/vocab.txt b/full_models/sch/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bf8c1ddef7c6843be713b778e7fac4c3dec8fcec --- /dev/null +++ b/full_models/sch/vocab.txt @@ -0,0 +1,40 @@ +f +x +3 +g +y +j +û +s +e +4 +â +d + +a +ô +- +l +c +ê +z +p +_ +u +h +w +k +n +' +q +b +1 +v +0 +î +— +m +r +i +t +o diff --git a/full_models/sck/D_100000.pth b/full_models/sck/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e8cac4c83fce05a7016b4b9c8387a3e03d53bbb2 --- /dev/null +++ b/full_models/sck/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd547b2e7de02a7986e23844bc09ddb14efbe5ecff131a58dcceadc86f38ba61 +size 561079342 diff --git a/full_models/sck/G_100000.pth b/full_models/sck/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..09fc8645bef4742cb24cba116022af916acd2efc --- /dev/null +++ b/full_models/sck/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:288a093c6c300e2ca80f18fd3c7dff9b194b18916becc7e00f4dc475fde3fb4e +size 436433825 diff --git a/full_models/sck/config.json b/full_models/sck/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sck/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sck/vocab.txt b/full_models/sck/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..06f7e56af5da57f6b31cb7e5fd834d41f650b7af --- /dev/null +++ b/full_models/sck/vocab.txt @@ -0,0 +1,60 @@ +ढ +ः +ऊ +च +त +ी +ु +भ +ं +प +द +आ +ृ +ड +न +य +श +ट +घ +उ +_ + +म +े +इ +फ +ै +थ +स +व +ठ +अ +् +ल +ण +ऐ +ह +ख +ज +छ +‍ +ा +ग +- +ष +ध +ि +ौ +़ +' +ब +ू +क +झ +ो +र +ओ +ञ +ई +ए diff --git a/full_models/sda/D_100000.pth b/full_models/sda/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..804ddbb45ed8a33bad22268fe27707dae8bb723c --- /dev/null +++ b/full_models/sda/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d61da99c96404dc68eb49e0f2eb309c77e37207c3bec9de1966e5279e2ad1e +size 561078859 diff --git a/full_models/sda/G_100000.pth b/full_models/sda/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..74c001b9feded4f417a63ba2c2c0d3dc60ac5138 --- /dev/null +++ b/full_models/sda/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c029e48c89f29c6b8b3a7e750347818a96e422682c3cba8b5b491ff3bb3d034 +size 436361250 diff --git a/full_models/sda/config.json b/full_models/sda/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sda/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sda/vocab.txt b/full_models/sda/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2c66ef13db33310968919fa37e16785e7615f1c4 --- /dev/null +++ b/full_models/sda/vocab.txt @@ -0,0 +1,29 @@ +i +u +' +k +t +p +d +– +z +w +l + +r +a +g +h +- +f +m +ë +y +c +e +s +o +b +n +j +_ diff --git a/full_models/sea/D_100000.pth b/full_models/sea/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2568bc5ce36fc5362328a1a4468ea66767fb6881 --- /dev/null +++ b/full_models/sea/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5308938ea74814546f6c6ab7095b3ad0f14ec55b4e955ad68a8dc66c88c165f +size 561076178 diff --git a/full_models/sea/G_100000.pth b/full_models/sea/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02a3ff979db474cf49840a9ee746bb419796d06e --- /dev/null +++ b/full_models/sea/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de57a2d6d50f54e2aa126ccd20a82436682858573824a5f12eadd1b5adfee4d +size 436362693 diff --git a/full_models/sea/config.json b/full_models/sea/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sea/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sea/vocab.txt b/full_models/sea/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..abc684f04258c77e7ed4336f17ffe27e97d3d169 --- /dev/null +++ b/full_models/sea/vocab.txt @@ -0,0 +1,39 @@ +r +y + +g +2 +m +z +1 +4 +s +q +c +5 +- +h +n +k +' +7 +w +u +o +b +j +i +6 +ñ +d +p +ò +0 +è +f +é +_ +l +e +t +a diff --git a/full_models/seh/D_100000.pth b/full_models/seh/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..894d7d4af64e62f17d3ef2f6518c4c0967ceab4d --- /dev/null +++ b/full_models/seh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd5e009072b9101284f5219684478fbb660b3e44958bd5634a3134f3a9345874 +size 561078883 diff --git a/full_models/seh/G_100000.pth b/full_models/seh/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d57e2bac10555418f22067dd1ee1753bb29b20e --- /dev/null +++ b/full_models/seh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7b942496d258f52590c24178a8f3f81899d08390af80a6b122a23d7a3551bf +size 436362917 diff --git a/full_models/seh/config.json b/full_models/seh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/seh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/seh/vocab.txt b/full_models/seh/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..09dff124944c79c60be8a2c2b7d5ff750b7ebbdb --- /dev/null +++ b/full_models/seh/vocab.txt @@ -0,0 +1,29 @@ +a +| +n +i +u +e +k +m +o +w +t +p +d +b +h +y +l +z +s +g +r +c +f +' +j +v +x +- + diff --git a/full_models/ses/D_100000.pth b/full_models/ses/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..979bc12101a623cb50fac134a21d7a169ad597a3 --- /dev/null +++ b/full_models/ses/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a85881ab28d2043d3ff44da3e4ad204a2a8a7bcd233b403f374458e67b6b0adf +size 561078972 diff --git a/full_models/ses/G_100000.pth b/full_models/ses/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8679a1cdc8ec40c084a8031e9f1e8e30a5fb260b --- /dev/null +++ b/full_models/ses/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f18e66eceeb19e76196667a782d2b169bb118469f5915559ebc2516ee59127 +size 436374876 diff --git a/full_models/ses/config.json b/full_models/ses/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ses/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ses/vocab.txt b/full_models/ses/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d4e72fb8b5b86ce6b25213b64caf3a3e857223ec --- /dev/null +++ b/full_models/ses/vocab.txt @@ -0,0 +1,36 @@ +e +a +c +t +ɲ +g +ž +r +y +u +k +i +ã +š +_ +õ +ũ +d +n +s +p +ẽ +z +f +o +h +ŋ +ʼ +j +- + +w +l +m +b +– diff --git a/full_models/sey/D_100000.pth b/full_models/sey/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f39cc0610b68513edfe00c7ad783d90be7ad01e5 --- /dev/null +++ b/full_models/sey/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d693e6c734bed30f17d11653a57765106dcecee7f167eed2adb420d87d0203 +size 561079002 diff --git a/full_models/sey/G_100000.pth b/full_models/sey/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68ed4aab0db893be38a86147c660b69cf1e8a0a3 --- /dev/null +++ b/full_models/sey/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39de3142b9bada6488bb98ea9520e10d0be60a975f2c35886556a2d51b04298 +size 436381457 diff --git a/full_models/sey/config.json b/full_models/sey/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/sey/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sey/vocab.txt b/full_models/sey/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1c7e687f9ed9d49249eb30380dbcfb47d5d988a1 --- /dev/null +++ b/full_models/sey/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +e +' +ë +u +o +j +p +c +̱ +s +y +r +n +h +t +m +q +ñ +d +l +b +ú +í +é +g +f +z +ó +á +v +̲ +x +k + diff --git a/full_models/sgb/D_100000.pth b/full_models/sgb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2331c81e5640f519e95ca6d7f4ff7244ffa0568c --- /dev/null +++ b/full_models/sgb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6365baaeef76b0306f492fbab0641e4cbf8a5ecb15ae1f5a2faff9713a7ebc9d +size 561078706 diff --git a/full_models/sgb/G_100000.pth b/full_models/sgb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a8c0020ba2d7a1cf15db41a7986fa0c8683a6c80 --- /dev/null +++ b/full_models/sgb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e27d146cb3fee958e4f7c8765b985aba0af885f67ef16f0401483daff32d90 +size 436387522 diff --git a/full_models/sgb/config.json b/full_models/sgb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sgb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sgb/vocab.txt b/full_models/sgb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5dd6287e188f3d118e0a66d429b188376daf5229 --- /dev/null +++ b/full_models/sgb/vocab.txt @@ -0,0 +1,42 @@ +a +| +n +i +y +o +h +m +l +k +t +p +g +ê +b +u +r +s +w +d +e +- +j +c +á +í +f +z +v +q +ú +0 +x +1 +2 +ó +ñ +5 +6 +4 +3 + diff --git a/full_models/sgj/D_100000.pth b/full_models/sgj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..431946d2e37246a99cfe55156502918cf12b4da6 --- /dev/null +++ b/full_models/sgj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c42182617c234a1da95b439f2c25114e89d66a7fb283ea6fd67f814d86094a +size 561076186 diff --git a/full_models/sgj/G_100000.pth b/full_models/sgj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a1294a3db062d78eaeab0076846aec36ba710543 --- /dev/null +++ b/full_models/sgj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee88af22b21b3fa64ec8a47a4f3a909ff7147b4cf7b3e9e51c58e6efbefe2017 +size 436388179 diff --git a/full_models/sgj/config.json b/full_models/sgj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sgj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sgj/vocab.txt b/full_models/sgj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9020d7291ad47252eb20fccd6fd67662ec778aa6 --- /dev/null +++ b/full_models/sgj/vocab.txt @@ -0,0 +1,50 @@ +े +् +' +ट +त +ओ +उ +ो + +ि +ं +ख +थ +ए +ल +ढ +च +र +ब +म +ध +ज +न +ई +ी +ग +़ +ऊ +भ +_ +द +ू +ु +प +- +ड +स +घ +व +य +आ +ह +इ +अ +ा +क +झ +ठ +छ +फ diff --git a/full_models/sgw/D_100000.pth b/full_models/sgw/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..32e37e7f361b0d8b700d21c1ab4eaddbfc3a2486 --- /dev/null +++ b/full_models/sgw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110043cbb1811435ecb3408409f8674d7a648ce183226390baef3ad77553e622 +size 561078965 diff --git a/full_models/sgw/G_100000.pth b/full_models/sgw/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..903912469d430c50abf7598552508b0fffa79254 --- /dev/null +++ b/full_models/sgw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8f35ed3b0fbeb3de4890652e1b41ca4e1f9a826231478edd24e6b7abc342bb +size 436359549 diff --git a/full_models/sgw/config.json b/full_models/sgw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..993d1dedb1d0c8e820b98f9e2f019ff166327038 --- /dev/null +++ b/full_models/sgw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.uroman", + "validation_files": "dev.uroman", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sgw/vocab.txt b/full_models/sgw/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf59b28ae2f095ea42d626e977a7e198fb23c678 --- /dev/null +++ b/full_models/sgw/vocab.txt @@ -0,0 +1,29 @@ + +' +2 +` +a +b +c +d +e +f +g +h +i +j +k +l +m +n +o +p +q +r +s +t +u +w +x +y +z diff --git a/full_models/shi/D_100000.pth b/full_models/shi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7cf741d7eca80c8541eb94416b3fc83d8af92525 --- /dev/null +++ b/full_models/shi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32c2d0a9ec0e97f98e66fd33b4cd95a314a800f94eca4bb2b325dbcdd2e0350a +size 561079010 diff --git a/full_models/shi/G_100000.pth b/full_models/shi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02c300a3fbf0e0bea9e654ce2c9d0fe1abb09e4c --- /dev/null +++ b/full_models/shi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf9258733d0e8b6f11350f7f942bf0cba5918686e7266451e5f2d6908385f61 +size 436379555 diff --git a/full_models/shi/config.json b/full_models/shi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/shi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/shi/vocab.txt b/full_models/shi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0520e2419a135c2318d4aedcd21842fc4a0e9d14 --- /dev/null +++ b/full_models/shi/vocab.txt @@ -0,0 +1,36 @@ +h +j +b +ε +ṣ +ṭ +u +a +š +‐ +ḥ +r +t +f +_ +d +z +q +ḫ +â +s +i +l +k +g +ġ +m +1 +ÿ +n +ḍ +ẓ +w +e + +y diff --git a/full_models/shk/D_100000.pth b/full_models/shk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f59330a133acbdca8e8d2dcb295e1343571b8a83 --- /dev/null +++ b/full_models/shk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aca6ebd994cd11ade2cf647d47b2b90c9c18f41b13c29abaca01ee7d32b529b +size 561078882 diff --git a/full_models/shk/G_100000.pth b/full_models/shk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d017f10f1e853cf5121928111776cb78513187a8 --- /dev/null +++ b/full_models/shk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2f355b876e037be082d661bdc81a64dc94a5f7790f4cf3e54922bd49da7179 +size 436402514 diff --git a/full_models/shk/config.json b/full_models/shk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/shk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/shk/vocab.txt b/full_models/shk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..23d7295ed695ab47070f205f933d6ca6236082cb --- /dev/null +++ b/full_models/shk/vocab.txt @@ -0,0 +1,47 @@ +| +ɑ +n +i +g +k +e +y +ø +w +d +m +ë +b +l +h +j +r +ï +u +̈ +ö +t +- +o +p +́ +c +ì +ó +s +í +̀ +a +á +è +ù +' +– +— +é +ú +ä +8 +2 +1 + diff --git a/full_models/shn/D_100000.pth b/full_models/shn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8961dd3f103532ffdcac5b5410d56c204bf3a54f --- /dev/null +++ b/full_models/shn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2466404998d82e3ffba0d8955b5838c382aad66b89d30751f3f913d6b0c8a8db +size 561078348 diff --git a/full_models/shn/G_100000.pth b/full_models/shn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ddad28f8eb6b3a72d8f047ae9e0cb50a65f041d3 --- /dev/null +++ b/full_models/shn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac630366f73fbcf16549c09892bf243bbc21b8218ced08ad78457cbbe53dd2f +size 436391873 diff --git a/full_models/shn/config.json b/full_models/shn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/shn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/shn/vocab.txt b/full_models/shn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cecbbec780d8af982e10ff7ab75affa3cfd10f32 --- /dev/null +++ b/full_models/shn/vocab.txt @@ -0,0 +1,44 @@ +| +် +ၼ +ႈ +း +ဝ +ႃ +ၵ +ႇ +တ +မ +င +ူ +ဢ +ႉ +ိ +လ +ၢ +ၸ +ေ +ပ +သ +ု +ႁ +ႆ +ၶ +ႂ +ွ +ဵ +ယ +ႄ +ီ +ၽ +ႅ +- +ြ +ထ +ၺ +ျ +ရ +' +ႀ +ၿ + diff --git a/full_models/sho/D_100000.pth b/full_models/sho/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f9a1510aabf1f4c01541d009f423859d315a5b7 --- /dev/null +++ b/full_models/sho/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b187bb8ed9b6739198841b2e982c5984ffcadc4e8ce7c8c0555de1cf6d9dd1df +size 561078220 diff --git a/full_models/sho/G_100000.pth b/full_models/sho/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..27413d68af617309138da43a5cb200220c89e50b --- /dev/null +++ b/full_models/sho/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669fef57e46b6d3659027505bb5f255d559bf195438496eec877fc55ef8d93c8 +size 436398650 diff --git a/full_models/sho/config.json b/full_models/sho/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sho/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sho/vocab.txt b/full_models/sho/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..db31fdb83df746103514089e97496a15ebe66a4b --- /dev/null +++ b/full_models/sho/vocab.txt @@ -0,0 +1,48 @@ +| +a +i +ɛ +k +b +n +e +o +d +t +m +g +à +ã +u +l +h +ɔ +ì +z +s +w +̃ +y +̀ +j +á +' +ũ +p +ĩ +c +ò +è +́ +ù +ǹ +f +r +é +ń +ó +ḿ +v +í +ú + diff --git a/full_models/shp/D_100000.pth b/full_models/shp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..df1c580ad75bdb06bee8dba96defbb44c3676441 --- /dev/null +++ b/full_models/shp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d3d8c9d5029bf05b260fcdf16ee9a8d5cb22ae347a9c8d7f725e4686d2d958 +size 561078844 diff --git a/full_models/shp/G_100000.pth b/full_models/shp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82a9d21002b7d368a6043de58be7f92904408c2f --- /dev/null +++ b/full_models/shp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4569e4a6fae1939d9d819ce2b918d408e0c6f569e7046a6ff0cf2c02880bbb0 +size 436379830 diff --git a/full_models/shp/config.json b/full_models/shp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/shp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/shp/vocab.txt b/full_models/shp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c3a01ca3c049e25405cdf73f0b39122f1bf6ba70 --- /dev/null +++ b/full_models/shp/vocab.txt @@ -0,0 +1,37 @@ +a +| +i +n +o +k +e +j +t +b +s +r +m +x +h +y +w +á +p +c +í +d +é +u +l +— +ó +g +ú +f +z +' +v +q +ñ +- + diff --git a/full_models/sid/D_100000.pth b/full_models/sid/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..25ad3647a081ae96957759c427d68aac2b1e7d88 --- /dev/null +++ b/full_models/sid/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9831bbc2d8e8be616c4e44747aa95e61b100703ef5087bebf237ab45d966703 +size 561079123 diff --git a/full_models/sid/G_100000.pth b/full_models/sid/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9fcc24775d7f698cbd88d62670d56af70a91c803 --- /dev/null +++ b/full_models/sid/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5948cdeaf33d206a62fe2cc9f99ed2733fbff3890c247a2248a32e05a2e0909 +size 436382910 diff --git a/full_models/sid/config.json b/full_models/sid/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sid/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sid/vocab.txt b/full_models/sid/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..de9c57a99755e845e7ddcf7b4079b699e91d1bc9 --- /dev/null +++ b/full_models/sid/vocab.txt @@ -0,0 +1,38 @@ +a +| +n +i +o +e +s +h +u +t +r +m +k +l +d +y +g +b +' +c +w +q +f +x +j +p +z +0 +1 +2 +6 +4 +5 +- +3 +7 +8 + diff --git a/full_models/sig/D_100000.pth b/full_models/sig/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7f0dbc7ecfb3db4fe9583f16fec8125de76ba07f --- /dev/null +++ b/full_models/sig/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be82dcebcc6cf19bb23f28319ebb78aa33536406f4c4586d3a7cf93a6451674b +size 561078586 diff --git a/full_models/sig/G_100000.pth b/full_models/sig/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..872a42645e360a416a0295bb533da2c2b785b531 --- /dev/null +++ b/full_models/sig/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5e3a2282a0fdbc7b14250f6fe5d8c02247ff4696f835f5edebcd080b962082 +size 436366802 diff --git a/full_models/sig/config.json b/full_models/sig/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sig/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sig/vocab.txt b/full_models/sig/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ae1aa88aea860ff435cdafee58a60c54655b3a93 --- /dev/null +++ b/full_models/sig/vocab.txt @@ -0,0 +1,33 @@ +| +a +ɩ +y +ŋ +b +ʋ +l +ɛ +e +k +n +s +i +w +m +t +o +d +g +r +h +u +ɔ +p +f +á +v +- +' +z +̃ + diff --git a/full_models/sil/D_100000.pth b/full_models/sil/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ac92c71ee9930abd7d8ee7db8b02e4b3913ef4ac --- /dev/null +++ b/full_models/sil/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c620f3e4d85f6ac29af05a82460e8fbbcf142cf1c0b58b2b85c854b5ac1ffb65 +size 561078881 diff --git a/full_models/sil/G_100000.pth b/full_models/sil/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..52c7ca8d476da8e52ae4b18c2d7a1488837cbedf --- /dev/null +++ b/full_models/sil/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83224e581626c7fe242ba21c51e601b63e8aeaaea65a9b1766936b0b8ca08104 +size 436374300 diff --git a/full_models/sil/config.json b/full_models/sil/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sil/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sil/vocab.txt b/full_models/sil/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..99c1e2cb74c907cccc2a6c6be10cc6e092933fd2 --- /dev/null +++ b/full_models/sil/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +ŋ +u +l +ɛ +n +b +s +m +d +t +e +k +w +r +o +- +ↄ +h +p +y +j +g +c +f +í +z +á +v +' +́ +ú +ɔ + diff --git a/full_models/sja/D_100000.pth b/full_models/sja/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e4d16deff4eaf4a8153bf574b8e3aef381e94081 --- /dev/null +++ b/full_models/sja/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3008fc582c3f81c3fe8fdfc8b30637dfaddb0e1df963d896fade16e88983be +size 561078577 diff --git a/full_models/sja/G_100000.pth b/full_models/sja/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..81819b437be84c080a245de8bce4d0a6688e0e94 --- /dev/null +++ b/full_models/sja/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd175f32edf13a8534cf0606a8b07e02df2e24d15e0d8ae6c86e1ecfcc1f482 +size 436396593 diff --git a/full_models/sja/config.json b/full_models/sja/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sja/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sja/vocab.txt b/full_models/sja/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..edbcef7b89d4fe68e4d0166e314cc75d9ac74b35 --- /dev/null +++ b/full_models/sja/vocab.txt @@ -0,0 +1,46 @@ +a +| +i +e +p +r +' +ã +m +d +t +k +ɨ +o +j +c +u +h +n +b +w +s +õ +– +g +ĩ +l +á +̃ +y +ũ +ẽ +ë +́ +— +ú +é +v +í +f +ó +z +q +ñ +x + diff --git a/full_models/sjm/D_100000.pth b/full_models/sjm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2756c24e2177917d2384262692f4ada8a8890b38 --- /dev/null +++ b/full_models/sjm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4034c874b011b7beb620fbc2f5bca0d873eb4ffc6ab2e559f911870601b273ac +size 561078614 diff --git a/full_models/sjm/G_100000.pth b/full_models/sjm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f38d4d5aa736a59436ae7d6e5fa4f06735d3889c --- /dev/null +++ b/full_models/sjm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b2aea764a171d5a83ba6773756e2b2a50d8ee9c04e9b682fc41b17993d957d4 +size 436362023 diff --git a/full_models/sjm/config.json b/full_models/sjm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sjm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sjm/vocab.txt b/full_models/sjm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..884e4055d73e9af98d5f9b75f6a85ec427042c13 --- /dev/null +++ b/full_models/sjm/vocab.txt @@ -0,0 +1,31 @@ +a +| +n +i +u +m +s +k +t +l +b +y +g +o +ꞌ +p +d +h +e +w +j +r +- +ā +ō +ū +ī +ē +z +c + diff --git a/full_models/sld/D_100000.pth b/full_models/sld/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83c7f04f28ff65458acfdab410e631c4b507fbcb --- /dev/null +++ b/full_models/sld/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c3604f2383952d711fd351e3545c1929db3e45661f7346f3cb612bfb35907a +size 561078710 diff --git a/full_models/sld/G_100000.pth b/full_models/sld/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5d99ef83bc6fd0d28ab5729c433a02851eb46e3 --- /dev/null +++ b/full_models/sld/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4cfcda1178071fa1f1b1e40d5e0464ea5d2026f2fcd17f1544c33de4c211dc +size 436399092 diff --git a/full_models/sld/config.json b/full_models/sld/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sld/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sld/vocab.txt b/full_models/sld/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..71135bce0e266755c1ec4972916fba5a19e57500 --- /dev/null +++ b/full_models/sld/vocab.txt @@ -0,0 +1,46 @@ +| +́ +ɩ +ɛ +a +á +n +ʋ +r +w +s +l +ŋ +m +ɔ +k +b +i +t +í +u +h +e +é +z +o +p +d +y +ó +ú +ɓ +c +f +j +̃ +g +v +' +ẽ +ĩ +ã +õ +q +ṹ + diff --git a/full_models/slu/D_100000.pth b/full_models/slu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b56261c34504c96e4ff50e29307e55f5c0f080b --- /dev/null +++ b/full_models/slu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f978f12ace3086421b28ac90a56fad1b096cc14eb93576525c181effee46f645 +size 561076028 diff --git a/full_models/slu/G_100000.pth b/full_models/slu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf727da3c0d29506b615cbd071bc1674712093db --- /dev/null +++ b/full_models/slu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0c7bf82de590dda618fab82a21b3705f90aea5eb27cd5aa2d482068557e231 +size 436333757 diff --git a/full_models/slu/config.json b/full_models/slu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/slu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/slu/vocab.txt b/full_models/slu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9b427ba00da97b288db7bcbdc0a2f38aa6596bfa --- /dev/null +++ b/full_models/slu/vocab.txt @@ -0,0 +1,27 @@ +| +a +e +k +i +y +s +m +r +n +t +o +u +l +d +h +w +b +g +f +j +- +p +z +c +' + diff --git a/full_models/sml/D_100000.pth b/full_models/sml/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6edd636da732e7ca9bcc205354930d9f4d734025 --- /dev/null +++ b/full_models/sml/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddacac9c4d752b9f5cf5a0db5671ca618e7aa1a05cabcf1719344a89a3f74e0d +size 561078633 diff --git a/full_models/sml/G_100000.pth b/full_models/sml/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b2e256b59c38ca5da0601fb42a70a2c7b4dffff4 --- /dev/null +++ b/full_models/sml/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70126af763ac2a697093ad8eae5ad9b0ea68198930deba97634ce2eb46ea39f6 +size 436359837 diff --git a/full_models/sml/config.json b/full_models/sml/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sml/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sml/vocab.txt b/full_models/sml/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3457253de9fffab5577e9e3444212767a84ea350 --- /dev/null +++ b/full_models/sml/vocab.txt @@ -0,0 +1,30 @@ +a +| +n +i +m +u +' +s +k +g +t +l +b +y +p +h +d +o +e +w +ā +r +- +j +ō +ū +ē +ī +­ + diff --git a/full_models/smo/D_100000.pth b/full_models/smo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5169b5b40739dee601e5be34e5ccc81fe5b787e0 --- /dev/null +++ b/full_models/smo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111cccbbefe01afa049184f2121e4dc0eb111afd7da3471fa4df554c5fbd309c +size 561078855 diff --git a/full_models/smo/G_100000.pth b/full_models/smo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3a91080a337f80f8ff6475c8fa72fe91940fc72f --- /dev/null +++ b/full_models/smo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ba83540d8318cbf697b220b423dce414d3fd35f060ed156bc92813042ea1d36 +size 436353284 diff --git a/full_models/smo/config.json b/full_models/smo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/smo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/smo/vocab.txt b/full_models/smo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9378ffcbcbfa6bfb21274020afd9240368dabf79 --- /dev/null +++ b/full_models/smo/vocab.txt @@ -0,0 +1,26 @@ +o +g +ē +ō +v +u +m +- +p +r +i +f +l +e +t +ā +h +a +_ +n +k +ī +ū + +' +s diff --git a/full_models/sna/D_100000.pth b/full_models/sna/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f8eb2200bfb7a9e748e0e402729a6100e143a1c --- /dev/null +++ b/full_models/sna/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766d1debfa61c5ffd2bd0ebaeeab96e56bf348b8df427ad3e56b7253e7bf8cfb +size 561078976 diff --git a/full_models/sna/G_100000.pth b/full_models/sna/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..6282d61f929ebd5ddbf22929bd5627c07a08cf43 --- /dev/null +++ b/full_models/sna/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30bf33cef4cc4c39c22cd4c22454c652cba3c056138c7ac4097acacf9c8ae86a +size 436370786 diff --git a/full_models/sna/config.json b/full_models/sna/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sna/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sna/vocab.txt b/full_models/sna/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cf28408c83a2e187cab8297fe1d1f04224e004b0 --- /dev/null +++ b/full_models/sna/vocab.txt @@ -0,0 +1,33 @@ +w +a +m +t +b + +v +y +c +n +z +g +1 +o +r +_ +q +' +j +ʼ +l +i +4 +k +e +d +u +- +p +s +f +h +2 diff --git a/full_models/sne/D_100000.pth b/full_models/sne/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7f354f6f7fe54f684be1bde40f1adfeca1794da5 --- /dev/null +++ b/full_models/sne/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a697eead1f34695eed7cb26ab8f4f20ac5f93c3e330c5416331050fd341740 +size 561078768 diff --git a/full_models/sne/G_100000.pth b/full_models/sne/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d84415f254885e3dd1e6b54393dc6e1c7664cb1a --- /dev/null +++ b/full_models/sne/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdeafbb419c5769ab2d8fdbde1f67bdabc3995e901b733e32cf523ef53ef6017 +size 436384798 diff --git a/full_models/sne/config.json b/full_models/sne/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sne/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sne/vocab.txt b/full_models/sne/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c1a059b296ae429beda2c72b0e18cf5122c76420 --- /dev/null +++ b/full_models/sne/vocab.txt @@ -0,0 +1,40 @@ +| +a +n +o +i +u +d +ꞌ +e +h +g +s +t +k +r +m +p +b +y +j +- +l +w +f +— +z +v +c +0 +x +2 +1 +' +6 +4 +3 +7 +q +5 + diff --git a/full_models/snn/D_100000.pth b/full_models/snn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..98409fe0c1f013f5ee421fd2052092aaac0f85ac --- /dev/null +++ b/full_models/snn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02e77b1ec0a8fb36c75c9ac4ece9d2d79fbf5f6d8de1133602b744e24e17f4b +size 561077684 diff --git a/full_models/snn/G_100000.pth b/full_models/snn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dd11808fccd0dc0380d1dc0763b52053bd1d2a90 --- /dev/null +++ b/full_models/snn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15037d42191b79061a50ee5c7ecc7e4c7dca2c13d3ca61d06ac4063e3026354a +size 436376242 diff --git a/full_models/snn/config.json b/full_models/snn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/snn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/snn/vocab.txt b/full_models/snn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c6bec43422056435cca48be1ab3417bbf022f0c6 --- /dev/null +++ b/full_models/snn/vocab.txt @@ -0,0 +1,41 @@ +2 +0 +y +q +b +4 +ü + +k +p +o +v +l +é +c +m +á +d +i +f +a +ú +1 +z +j +— +s +n +u +g +í +ë +ñ +t +h +e +x +_ +ó +r +' diff --git a/full_models/snp/D_100000.pth b/full_models/snp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..521631c714e8834b1431a33edeed6ac87a2e65c6 --- /dev/null +++ b/full_models/snp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c58c753c985b6e9718d12f739e599d75e2a0ffa196ac2a400b36cdc8256fcd +size 561077555 diff --git a/full_models/snp/G_100000.pth b/full_models/snp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b93897a73581240e4b7aa0cad70495f0f2765443 --- /dev/null +++ b/full_models/snp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2344cb969f76fa8d4954f7b4a95b72ed9e8072520c9aeed509267fb23f025ba +size 436336653 diff --git a/full_models/snp/config.json b/full_models/snp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/snp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/snp/vocab.txt b/full_models/snp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9543e4f996ef2b919213bb133c034b1ce0669ae7 --- /dev/null +++ b/full_models/snp/vocab.txt @@ -0,0 +1,24 @@ +b +a +y +i +l +p +á +n +' +t +w +- +_ +k +f +u +o +m + +s +h +e +g +d diff --git a/full_models/snw/D_100000.pth b/full_models/snw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..13263927e3a43f5424d3c0ae8f6807fe8a6adb87 --- /dev/null +++ b/full_models/snw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65e41449a4e75fb631b82558e4de3c4ea5c8d85b679f1eeb8fa6ad5245dc399 +size 561078869 diff --git a/full_models/snw/G_100000.pth b/full_models/snw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a8aca3527be96c0aa5d35999782aa20ee19a2216 --- /dev/null +++ b/full_models/snw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b0b6f3960057761ec9bb4d823aace49e2536fc7730833e321e5ae1f00f5dd94 +size 436377749 diff --git a/full_models/snw/config.json b/full_models/snw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/snw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/snw/vocab.txt b/full_models/snw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1a08097489ca3a6cd405862e6978fd9a8d03d718 --- /dev/null +++ b/full_models/snw/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +n +k +o +e +l +ɛ +ɔ +b +u +t +s +y +m +w +f +d +p +ũ +r +ĩ +- +h +g +á +í +ã +v +é +̃ +' +à +ú +́ + diff --git a/full_models/som/D_100000.pth b/full_models/som/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f175d68f050ce8ab15851609c7549770c21c2dbb --- /dev/null +++ b/full_models/som/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53b85db771eec7e2579625793b407d33114ad3dae8a0828da2cd29da77352ac9 +size 561079132 diff --git a/full_models/som/G_100000.pth b/full_models/som/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..8fb08c180db5cc5abbc0840e3d64f0d76d7a3a24 --- /dev/null +++ b/full_models/som/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65f075ecbae7a189a48b3887af7546af50be3e32292d8afb789d3cf8e874e6a +size 436356938 diff --git a/full_models/som/config.json b/full_models/som/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/som/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/som/vocab.txt b/full_models/som/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1cf083f978b053b568c8a6ff84c42de4da7b1d6d --- /dev/null +++ b/full_models/som/vocab.txt @@ -0,0 +1,27 @@ +u +b + +e +c +' +f +w +l +j +d +n +r +i +g +q +m +t +_ +k +y +o +x +s +- +h +a diff --git a/full_models/soy/D_100000.pth b/full_models/soy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b036cd647af6e3ae1da07aa507f945cb588ec87 --- /dev/null +++ b/full_models/soy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:743944cedb1465b7f4c1367311d89ae699a9536544604f6b605af29bab22f638 +size 561079377 diff --git a/full_models/soy/G_100000.pth b/full_models/soy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b2e5058b73972b2d2841b8557df770fe8a1bc3cf --- /dev/null +++ b/full_models/soy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34df4f869bc61188485ed9c3850092e8a9c5741937f4e3606d06f837cb3404e9 +size 436401606 diff --git a/full_models/soy/config.json b/full_models/soy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/soy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/soy/vocab.txt b/full_models/soy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4328dd448566841ce34fd3e6c3963e5e9d026630 --- /dev/null +++ b/full_models/soy/vocab.txt @@ -0,0 +1,46 @@ +ɔ +ú +ũ +y +– +t +ɛ +r +ó +é +_ + +ë +w +l +́ +n +o +õ +ɑ +k +f +ṍ +ḿ +ø +i +á +- +c +ṹ +ń +ĩ +ŋ +í +̃ +ẽ +ñ +h +û +e +u +m +a +s +̀ +p diff --git a/full_models/spa/D_100000.pth b/full_models/spa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..09226b73149c02b40a82b36d69eb992a1bc96472 --- /dev/null +++ b/full_models/spa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07ab22829d36992fc47d7fde4d9e1313f2a8108d2442d489a0953b1910628d7a +size 561110151 diff --git a/full_models/spa/G_100000.pth b/full_models/spa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6bce5772dec5ca0c7f76ee292c667cbaa63f9742 --- /dev/null +++ b/full_models/spa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8feb91089b706e231efb18d0038f5827f1a9d1e45c57c61fba7ebe2198a7c1e6 +size 436635085 diff --git a/full_models/spa/config.json b/full_models/spa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/spa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/spa/vocab.txt b/full_models/spa/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..759ed624158f34d7fc0054ac6ceaf1cd492c43d9 --- /dev/null +++ b/full_models/spa/vocab.txt @@ -0,0 +1,45 @@ +7 +a +v +c +— +0 +5 +ó +8 +p +y +z +4 +m +ü +k +s +á +q +h +n +é +_ +9 +1 +f +t + +x +d +í +b +3 +j +g +l +2 +i +u +e +ú +o +ñ +r +6 diff --git a/full_models/spp/D_100000.pth b/full_models/spp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c6a9f2b929631d04a0de424507cf76edd302817 --- /dev/null +++ b/full_models/spp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ac5e42997d8aab1264e0fd29d3f2ea06d36288499e8fc4288e4fd7dae5fc8e +size 561078452 diff --git a/full_models/spp/G_100000.pth b/full_models/spp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af6904b0fa1c5a85b4b450b44062dc594f3cec86 --- /dev/null +++ b/full_models/spp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc5058d74bedb97f40772a1caaabbf177bc39bd0b63c429baa5c7ed85dc53cf +size 436408139 diff --git a/full_models/spp/config.json b/full_models/spp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/spp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/spp/vocab.txt b/full_models/spp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cee84f3a310dc530b764c6c7fa6205b1ea532013 --- /dev/null +++ b/full_models/spp/vocab.txt @@ -0,0 +1,51 @@ +| +i +a +n +y +e +u +k +m +p +r +ɛ +s +w +l +à +ŋ +ɲ +h +o +t +g +á +ɔ +b +c +f +' +j +ù +í +ì +è +̀ +d +ú +‐ +z +é +ò +î +́ +û +ê +â +̂ +v +ó +ô +- + diff --git a/full_models/spy/D_100000.pth b/full_models/spy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e963cef7a0f1b4abb34315f757b4cad511024f62 --- /dev/null +++ b/full_models/spy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0bd532458aab0494abce8be3c27344ca279f7a88fe1c699aebda9bf0078b55e +size 561078711 diff --git a/full_models/spy/G_100000.pth b/full_models/spy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..497bf67e9cef08235d7053cee5628d6b465593a2 --- /dev/null +++ b/full_models/spy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a9c5256c22e75780e2f8cbf9aabf2c3f948b358de6598e181f40f4124c550f +size 436359728 diff --git a/full_models/spy/config.json b/full_models/spy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/spy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/spy/vocab.txt b/full_models/spy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..26531bed0685e6a1cdb6cd35c8c15335a81434c9 --- /dev/null +++ b/full_models/spy/vocab.txt @@ -0,0 +1,30 @@ +| +k +o +ē +i +y +u +a +n +t +e +m +ā +ō +b +c +h +r +s +l +w +' +g +- +f +1 +2 +6 +0 + diff --git a/full_models/sqi/D_100000.pth b/full_models/sqi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..18489fe781bfbd21629bb519dd97601f538922cf --- /dev/null +++ b/full_models/sqi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2adf6cda0991e674787f49cefe3bb09a4745d943277f19e8b92977bc9a98806e +size 561078965 diff --git a/full_models/sqi/G_100000.pth b/full_models/sqi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6d1f17271b93799a4deeb27916ce4d18122db0cd --- /dev/null +++ b/full_models/sqi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0110cc041041bde72f81fd27edc043317ad66c69c598dcd2cca7fadd403be325 +size 436370905 diff --git a/full_models/sqi/config.json b/full_models/sqi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sqi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sqi/vocab.txt b/full_models/sqi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b89d09bed6069944c71db2a4d475bc95000e7b2f --- /dev/null +++ b/full_models/sqi/vocab.txt @@ -0,0 +1,34 @@ +| +ë +e +t +i +r +a +n +s +h +j +u +d +o +m +p +k +l +g +b +q +v +z +f +y +ç +' +c +x +- +è +– +à + diff --git a/full_models/sri/D_100000.pth b/full_models/sri/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..fece36e6da489f0829248a52791f2a0321fb9e04 --- /dev/null +++ b/full_models/sri/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b1ab540d1ddfb457db8eb32dfbed8ec06ac77695b8d3476887935b5707793e +size 561078598 diff --git a/full_models/sri/G_100000.pth b/full_models/sri/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..7272e556aad80adf8c2033dd8e3367055e504281 --- /dev/null +++ b/full_models/sri/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:454760e7bb1fd43dadcbc8482f250aff9098cec8c8eeec287fe7a271de283a1c +size 436399011 diff --git a/full_models/sri/config.json b/full_models/sri/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sri/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sri/vocab.txt b/full_models/sri/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dede8983d4aa7cf3e8f2019c71bb29f557d80e1d --- /dev/null +++ b/full_models/sri/vocab.txt @@ -0,0 +1,47 @@ +| +r +a +ã +e +i +ʉ +m +ĩ +g +s +o +u +p +k +̃ +b +d +y +ẽ +j +õ +t +w +n +ũ +ñ +í +́ +á +é +ú +c +l +— +ó +h +f +v +ü +' +ṍ +̶ +z +q +x + diff --git a/full_models/srm/D_100000.pth b/full_models/srm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dd0472a5ddd57c7ca632e7edf126e75129056f78 --- /dev/null +++ b/full_models/srm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f4e328ee8e27fc6c32f7c251c3ee97c769e24943bbfae7418e50ea095dd026 +size 561077993 diff --git a/full_models/srm/G_100000.pth b/full_models/srm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3208e98616b5aacdec83e88adc3e9c432d405299 --- /dev/null +++ b/full_models/srm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e168e1a72818f11bb7fabe6698e9b5e2b7d9e5fc238b11a2c320a94cbefb9177 +size 436375770 diff --git a/full_models/srm/config.json b/full_models/srm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/srm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/srm/vocab.txt b/full_models/srm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..38451ab62f4c14e3b24cfe35f896887b50cf3010 --- /dev/null +++ b/full_models/srm/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +n +u +d +e +ë +s +ö +t +k +o +m +b +f +g +w +h +l +j +p +˻ +˼ +z +' +- +v +0 +ú +1 +2 +4 +í +6 +r + diff --git a/full_models/srn/D_100000.pth b/full_models/srn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82765079c2905f1046f0e752ce9264cb6f635a6e --- /dev/null +++ b/full_models/srn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485cb49e29b1b2cc76c7955722726d9d7ac81958ddda089de9e1a549eceb0f81 +size 561078892 diff --git a/full_models/srn/G_100000.pth b/full_models/srn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7bdae4a903fab4b2c57d63c4cf88d1b3bb74b985 --- /dev/null +++ b/full_models/srn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234422c34b57a1ffee9775c3d6cc33a3359325cdc41a3464a821f399d173f148 +size 436374602 diff --git a/full_models/srn/config.json b/full_models/srn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/srn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/srn/vocab.txt b/full_models/srn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..47c3a0031b3f58a6c1173e1b72f1ff004d1c6f8d --- /dev/null +++ b/full_models/srn/vocab.txt @@ -0,0 +1,35 @@ +| +a +n +i +e +u +s +d +o +r +k +t +m +f +b +g +w +p +l +y +' +è +h +- +ê +v +ô +0 +j +1 +2 +z +á +c + diff --git a/full_models/srx/D_100000.pth b/full_models/srx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dc006fb7fc32f368688069859a47d9ad3eeb1452 --- /dev/null +++ b/full_models/srx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9efa259f4ffa92f442793e5710038ff9ceae0a558292cd304a10413677aca69d +size 561078720 diff --git a/full_models/srx/G_100000.pth b/full_models/srx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5e9200853e300758bf3ef93896761f1171b5ee46 --- /dev/null +++ b/full_models/srx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4531b3cf58fb19c2504651aea92eec8ef973dbe1b9e8b8c435ea5505f5ee7e11 +size 436439996 diff --git a/full_models/srx/config.json b/full_models/srx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/srx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/srx/vocab.txt b/full_models/srx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..72ca46d79d12d84d58fabb8561e2b698e82b1f23 --- /dev/null +++ b/full_models/srx/vocab.txt @@ -0,0 +1,64 @@ +| +ै +ा +ौ +र +क +त +ी +स +द +ि +ु +म +ज +ब +ं +ो +श +प +न +व +य +ल +ण +औ +े +ह +् +ए +आ +ख +थ +ू +ग +़ +ऐ +च +ई +ड +ट +भ +इ +ध +छ +अ +फ +ओ +ठ +ऊ +‍ +ढ +ष +घ +झ +ँ +- +उ +ञ +' +ृ +0 +4 +1 + diff --git a/full_models/stn/D_100000.pth b/full_models/stn/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..6c4d7c8bfc117fc1fc1b25887c23fb168662413e --- /dev/null +++ b/full_models/stn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543b2424f5e7ab0811849fabbb5e3f8c92a147681e99967733612ebac8ecd78f +size 561078616 diff --git a/full_models/stn/G_100000.pth b/full_models/stn/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..c75b357488d94411568ab3b57fd0081486939feb --- /dev/null +++ b/full_models/stn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c0c623f8f6018492d4ba21749d589c3e2c1d7c66aa8ddfc7346caec2ab6cc6 +size 436357462 diff --git a/full_models/stn/config.json b/full_models/stn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/stn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/stn/vocab.txt b/full_models/stn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..040dc683e53e1379ede546841614ded26f360331 --- /dev/null +++ b/full_models/stn/vocab.txt @@ -0,0 +1,28 @@ +a +| +i +n +r +o +k +g +m +u +e +t +f +w +s +p +q +h +d +j +l +b +v +' +5 +3 +9 + diff --git a/full_models/stp/D_100000.pth b/full_models/stp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d6aa79efc3426966d353757792b676df34c6661 --- /dev/null +++ b/full_models/stp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc774dec53baa6bc6a488ab2036cd9bd7396ebebd2f1df891ce520c6d0fda413 +size 561076177 diff --git a/full_models/stp/G_100000.pth b/full_models/stp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..11277ccd38d44d055649cee71ae48a671662ec8c --- /dev/null +++ b/full_models/stp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ebfdf3cc77d1a1a44875650b1c12aa2d7196c57cbd149f8da45a847eaf2ab5 +size 436337193 diff --git a/full_models/stp/config.json b/full_models/stp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/stp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/stp/vocab.txt b/full_models/stp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d216ab69f97d6769955719221a1a1d3dbf9ae03a --- /dev/null +++ b/full_models/stp/vocab.txt @@ -0,0 +1,28 @@ +| +a +' +i +u +m +j +h +n +ɨ +g +k +t +b +d +p +o +x +c +ñ +r +s +l +e +ɇ +y +f + diff --git a/full_models/suc/D_100000.pth b/full_models/suc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5596def15c16f01db0e37a58e783d5922f337097 --- /dev/null +++ b/full_models/suc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764345f2074fb9dea5ebf34a47cff00372296a971e104859f84dee1e42cc695d +size 561078736 diff --git a/full_models/suc/G_100000.pth b/full_models/suc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2dc60e74b6b752c51cde0def44f34bd01a69a16a --- /dev/null +++ b/full_models/suc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84efb39d2d5f16690148339dbaa6e6f894fa05a0bf020f685da1a299e2fefab3 +size 436352143 diff --git a/full_models/suc/config.json b/full_models/suc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/suc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/suc/vocab.txt b/full_models/suc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a0abcae22e3bc3f3a23294b3e7534ada5864316e --- /dev/null +++ b/full_models/suc/vocab.txt @@ -0,0 +1,26 @@ +| +o +n +a +g +i +u +m +k +t +s +l +d +ꞌ +p +b +y +w +r +e +h +' +— +0 +5 + diff --git a/full_models/suk/D_100000.pth b/full_models/suk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f6343fb2dc5ce74189b4c81430f909f2c439e1c5 --- /dev/null +++ b/full_models/suk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4697288f8a1d7d570bfa9ac1672fd8d0f6d2e0fedb0954b95e6750d005bb5a46 +size 561078996 diff --git a/full_models/suk/G_100000.pth b/full_models/suk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c84196bd1bb2319a9119325f914965e26a7e3378 --- /dev/null +++ b/full_models/suk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52c604dac0c5981a6b7f27a158ff22a54232bd5ca90155cabd71c4033a4eb01d +size 436379380 diff --git a/full_models/suk/config.json b/full_models/suk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/suk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/suk/vocab.txt b/full_models/suk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..534e248c09a4d609c8740f9015705ad4f9c1ce43 --- /dev/null +++ b/full_models/suk/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +ū +l +ī +g +e +i +o +b +k +w +h +m +y +u +s +t +j +' +d +z +p +f +c +ò +- +v +ó +à +è +0 +1 +2 +ì + diff --git a/full_models/sun/D_100000.pth b/full_models/sun/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8d98836f3d03cf3392b40ccda210faf4c81483d6 --- /dev/null +++ b/full_models/sun/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad4007da5b4e9fd44d7348f10c7500693f2796aaa49e1f2625dfa419b4a7f49 +size 561078961 diff --git a/full_models/sun/G_100000.pth b/full_models/sun/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..76e04b6687552729f7e18f561c322d5e1d8113e0 --- /dev/null +++ b/full_models/sun/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1efed97706d99b1288e7f998b93e5bb5985ddcdfc5522c456d295732dd2722a0 +size 436380536 diff --git a/full_models/sun/config.json b/full_models/sun/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1f20c1e349fa34cb5c4ec81962ddafa6026954e0 --- /dev/null +++ b/full_models/sun/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 48, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sun/vocab.txt b/full_models/sun/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..762cb1cef0b1f081ffb13b441dcfcc9544fddf84 --- /dev/null +++ b/full_models/sun/vocab.txt @@ -0,0 +1,37 @@ +a +| +n +u +e +i +k +g +r +t +s +l +h +m +d +p +b +j +y +o +w +- +c +' +f +0 +2 +6 +1 +5 +4 +7 +3 +8 +z +9 + diff --git a/full_models/sur/D_100000.pth b/full_models/sur/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..828a5c43cd78147b257c343ba378de489213320f --- /dev/null +++ b/full_models/sur/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f6917198404bce7cc24efde40660d899de61c7caf072e17f48c7c166975896 +size 561078512 diff --git a/full_models/sur/G_100000.pth b/full_models/sur/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c0c0b6749f2c090b821c798b0b795ec6731aa06b --- /dev/null +++ b/full_models/sur/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0f91ba2d437e1d9be51a9976bb9bece0ade2c08f9b066ff4d2e2a98ba06545 +size 436380448 diff --git a/full_models/sur/config.json b/full_models/sur/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sur/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sur/vocab.txt b/full_models/sur/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..df2141a41470afa4443bec1cfa6f20cc6c96c82a --- /dev/null +++ b/full_models/sur/vocab.txt @@ -0,0 +1,39 @@ +| +i +a +n +e +m +u +k +o +s +r +ɗ +w +g +̶ +t +p +h +l +y +ɓ +b +j +d +f +̵ +ì +c +z +` +í +á +- +à +v +' +ú +é + diff --git a/full_models/sus/D_100000.pth b/full_models/sus/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4c39ce4aee30dcfa82587755e17997861ddeb3d0 --- /dev/null +++ b/full_models/sus/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963ef6f86f0587393b2e7191fefde37722f4fda54b5979987e860ad112c6dba9 +size 561079240 diff --git a/full_models/sus/G_100000.pth b/full_models/sus/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8310a17fc6132f7ceb8e0ffaf61bf1f3a245d73f --- /dev/null +++ b/full_models/sus/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e6da1b1fe88e3411e0d66aa9faf0f5492124356120a557b928df5af136f0072 +size 436356942 diff --git a/full_models/sus/config.json b/full_models/sus/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sus/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sus/vocab.txt b/full_models/sus/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e3919428715857ad325cdd88e787ebb940e066b5 --- /dev/null +++ b/full_models/sus/vocab.txt @@ -0,0 +1,27 @@ +| +a +n +i +x +e +m +ɛ +r +u +b +o +l +ɔ +s +y +t +f +k +d +w +g +ɲ +h +p +- + diff --git a/full_models/suv/D_100000.pth b/full_models/suv/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..b41294405b27431994bdf9aba4dfceb60ff584e9 --- /dev/null +++ b/full_models/suv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ed47450525af3a0264ce1ef068acf98c8ef118f47c9f2a4c3ae1534ef69ebf +size 561076161 diff --git a/full_models/suv/G_100000.pth b/full_models/suv/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddf82d3993e8bf83c61864cb8284185b72a49824 --- /dev/null +++ b/full_models/suv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0de1cb831fd62343941e5379f2196f27f33891d4109a00a2e89497a6608561d +size 436348497 diff --git a/full_models/suv/config.json b/full_models/suv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/suv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/suv/vocab.txt b/full_models/suv/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..4a08ce0e4e021f97d32c52be753dbc089fdda9df --- /dev/null +++ b/full_models/suv/vocab.txt @@ -0,0 +1,33 @@ +a +| +i +n +e +o +u +r +t +k +g +b +l +j +ë +s +h +d +p +m +c +y +w +ü +f +' +v +z +ǃ +ː +̈ +- + diff --git a/full_models/suz/D_100000.pth b/full_models/suz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f1a35016ec98588871497b3e43c7be456d4062e9 --- /dev/null +++ b/full_models/suz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e25aead8ff26cc67b9d828ed62e5f82c1cde99068f823d1014aeb700d516708 +size 561078867 diff --git a/full_models/suz/G_100000.pth b/full_models/suz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a882d91f268a73b1b83fe89318fe70a34f257b9 --- /dev/null +++ b/full_models/suz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c918938f5f3883dc74cd143da5d1373059a4a0dad4affcff75de888eac6268 +size 436447857 diff --git a/full_models/suz/config.json b/full_models/suz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/suz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/suz/vocab.txt b/full_models/suz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..36b9dc367e78136cfe7ac63d9bfbde44b1e290a8 --- /dev/null +++ b/full_models/suz/vocab.txt @@ -0,0 +1,67 @@ +आ +‍ +ग +ठ +थ +़ +ै +१ +० +म +ा +य +क +त +श +ब +च +ढ +७ +घ +ह +ओ +ल +र +छ +द +_ + +ो +४ +इ +ौ +औ +ं +् +२ +८ +' +ि +३ +ज +प +ख +ध +ऊ +ऐ +झ +५ +भ +ु +ए +६ +न +अ +े +९ +व +उ +ट +ई +ड +- +ी +ू +फ +स +ङ diff --git a/full_models/swe/D_100000.pth b/full_models/swe/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..b09072cedfdca8065e704701a01be23bd5068bcc --- /dev/null +++ b/full_models/swe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5f722b2910f9e27bc26652e289ac1e22214c9e1d72e74dcd93f55511d8663b +size 561110509 diff --git a/full_models/swe/G_100000.pth b/full_models/swe/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..4923d6895277738b2365be374569b0015b68fe79 --- /dev/null +++ b/full_models/swe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d9c41935cbfdc8fdaa712a58c7d7b4708f7763a0ddf1cbe0c90b1c0b2fcd75 +size 436617638 diff --git a/full_models/swe/config.json b/full_models/swe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/swe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/swe/vocab.txt b/full_models/swe/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..a6ebc23970f4e0a6f1366c2b428e68f7b34bc5c4 --- /dev/null +++ b/full_models/swe/vocab.txt @@ -0,0 +1,37 @@ +x +e +b +o +l +r +– +j +a +7 +n +m +2 +y + +d +é +s +h +ö +_ +g +' +c +u +- +z +q +f +p +i +6 +å +t +ä +k +v diff --git a/full_models/swh/D_100000.pth b/full_models/swh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f45716651f9db628e5c04f8d4409bf3f06a60e92 --- /dev/null +++ b/full_models/swh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44c61cfd3778ab247a27de9f7dcbe942301fcc9f43f5fcc05982c8d7c89d183 +size 561110142 diff --git a/full_models/swh/G_100000.pth b/full_models/swh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..75d24a3b72ccf7b3a30cabd8675da2effb4cb527 --- /dev/null +++ b/full_models/swh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4025e6a8d9aab68a4b252fcdf91a95997029cd2c21fd9f09a4b07318955b59 +size 436621343 diff --git a/full_models/swh/config.json b/full_models/swh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/swh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/swh/vocab.txt b/full_models/swh/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf11713b3ace09a6de26f2dc165ebccbf5a0b46f --- /dev/null +++ b/full_models/swh/vocab.txt @@ -0,0 +1,39 @@ +2 +m +d +r +j +l +s +8 +c +- +k +e +p +0 +g +u +w +7 +4 +b +f +v +i +1 +3 +o +t +6 +z +a +y +5 +n +q + +ʼ +' +h +_ diff --git a/full_models/sxb/D_100000.pth b/full_models/sxb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a64490620e34c1c0582af4b4829c56a244e6cde --- /dev/null +++ b/full_models/sxb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7776f203181d572ead2cfe76bd1ce0bd15d7f4cfd407d6fda5b59c755fd0ca7f +size 561078842 diff --git a/full_models/sxb/G_100000.pth b/full_models/sxb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6d7571d6ab0fc7f5cff9f378b81d76d11cc3a35c --- /dev/null +++ b/full_models/sxb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b434d34fcf94392e2a0e72d0ff45fee648f38ffa4309e727385c368460d87150 +size 436367249 diff --git a/full_models/sxb/config.json b/full_models/sxb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sxb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sxb/vocab.txt b/full_models/sxb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8c94fe22ef7839bf0407e57475e9240cdad6b95a --- /dev/null +++ b/full_models/sxb/vocab.txt @@ -0,0 +1,32 @@ +r +2 +0 +p +y +t +k +b +m +c +v +h +o +i +- +e + +j +4 +d +z +g +' +n +f +s +u +a +l +1 +w +_ diff --git a/full_models/sxn/D_100000.pth b/full_models/sxn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5846ba480af6ef7ee2ac642ff3a7f4b51f7ad786 --- /dev/null +++ b/full_models/sxn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc3f4c2ab74098e01121a7a1bd426f6326cd452c365045761f5a05a490d8ab4 +size 561078976 diff --git a/full_models/sxn/G_100000.pth b/full_models/sxn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..38c64825ca8ca140a2bed1eaaee41b64eaf755f4 --- /dev/null +++ b/full_models/sxn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446fafd5d11c314eb0f90132af760017b0b954a748910e51b22b8b9adccc5ac8 +size 436389828 diff --git a/full_models/sxn/config.json b/full_models/sxn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sxn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sxn/vocab.txt b/full_models/sxn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..55ca6581a3a8a3a4df42ed932d69243cd908d283 --- /dev/null +++ b/full_models/sxn/vocab.txt @@ -0,0 +1,41 @@ +| +a +n +e +u +i +g +k +s +m +t +r +l +ẹ +ě +o +̌ +p +w +h +ạ +b +d +᷊ +ụ +ọ +ị +' +y +- +j +f +z +c +0 +ú +4 +1 +ó +2 + diff --git a/full_models/sya/D_100000.pth b/full_models/sya/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d1ee4339519bd7d81c7fbd4ce09873d68ff09ab --- /dev/null +++ b/full_models/sya/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e6f4e3f72d5dafacc3d648f900a555bc9cf55f597962f36ba0bf481c9c2f4c +size 561076027 diff --git a/full_models/sya/G_100000.pth b/full_models/sya/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..462302cd4523f2a06e72beccd3df347773825710 --- /dev/null +++ b/full_models/sya/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b10d2dbd8feefedb5c25666f51a61a5493854f0045656f582cf9a1fa291d44e4 +size 436331314 diff --git a/full_models/sya/config.json b/full_models/sya/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sya/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sya/vocab.txt b/full_models/sya/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c369d02e32b42600e0c94729848fc90f354b7f3d --- /dev/null +++ b/full_models/sya/vocab.txt @@ -0,0 +1,26 @@ +a +j +' +o +c +m +h +b +– +l +u +t +y +e +- +_ +r +w +s +k +i +p + +n +d +g diff --git a/full_models/syl/D_100000.pth b/full_models/syl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cae6436e2087f2ef1ba9336e37b49b8b2861aa44 --- /dev/null +++ b/full_models/syl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a061936831ac550ad788b30fbaf94734b324e122cfa0c927f00117c0f76cecf +size 561076203 diff --git a/full_models/syl/G_100000.pth b/full_models/syl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d3d9e45206b35689bf2238c5d78b6cd157ba36ed --- /dev/null +++ b/full_models/syl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba028de629a1600c26ab249b550d887366343a7bd707f23bcde275f5c502e184 +size 436346666 diff --git a/full_models/syl/config.json b/full_models/syl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/syl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/syl/vocab.txt b/full_models/syl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ecf62874f836a6526f2310d10f46d9a1879988e2 --- /dev/null +++ b/full_models/syl/vocab.txt @@ -0,0 +1,32 @@ +| +a +o +i +r +e +n +t +u +l +m +s +ḳ +b +h +d +z +k +g +f +ṭ +- +ṛ +c +ḍ +j +p +y +ʼ +' +— + diff --git a/full_models/sza/D_100000.pth b/full_models/sza/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a7ceee9ae77c26d2977c5c919f5ac6d75586246f --- /dev/null +++ b/full_models/sza/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d4873a70ba94de87b72309edbc194c76ec52ba045beb05b9a7467edfde8109 +size 561075774 diff --git a/full_models/sza/G_100000.pth b/full_models/sza/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02553b0ce9d5714490798b718e9331200a31463e --- /dev/null +++ b/full_models/sza/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628060b6c0e8d0bdbc5cce152999691773c8fe0431fd92cc0935d8b159561442 +size 436329562 diff --git a/full_models/sza/config.json b/full_models/sza/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/sza/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/sza/vocab.txt b/full_models/sza/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..60f352f905c660d294f341851ef8b794fd5357da --- /dev/null +++ b/full_models/sza/vocab.txt @@ -0,0 +1,26 @@ +w +r +j +c +_ +h +n +– +u +o +t +' +d +p +b +k +g +a + +m +y +- +i +l +e +s diff --git a/full_models/tac/D_100000.pth b/full_models/tac/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fb6f04730681f14ccb714ce0eba22a709be883a2 --- /dev/null +++ b/full_models/tac/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7bdc07cfd55d3b1ddf6336b5150a77a410e2b6494092e3d2349fe52fd69a770 +size 561078728 diff --git a/full_models/tac/G_100000.pth b/full_models/tac/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6db52a7dbc84876ed84ec01e890c37b0ec1899b9 --- /dev/null +++ b/full_models/tac/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff2977881898d6cb79e97b3868435d26c2bc19368268d496c641c42ef715fba +size 436368984 diff --git a/full_models/tac/config.json b/full_models/tac/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tac/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tac/vocab.txt b/full_models/tac/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..709b56ff9b9aba6223d3b9c6f7a6789a4c2c7b36 --- /dev/null +++ b/full_models/tac/vocab.txt @@ -0,0 +1,34 @@ +n +e +ó +i +d +b +v +s +á +r + +p +h +a +í +é +l +f +ñ +_ +y +t +k +— +c +u +w +' +o +g +j +ú +- +m diff --git a/full_models/taj/D_100000.pth b/full_models/taj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..20c035a0041367f4fcb02b5c46838daa02d8d549 --- /dev/null +++ b/full_models/taj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ed9c9c4153f0eab68eeee1ef2872582a277d30c6e4772fba4014049e3d545a +size 561078633 diff --git a/full_models/taj/G_100000.pth b/full_models/taj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff783cde7f4c402ca6d8fb224f8f99bfcf416629 --- /dev/null +++ b/full_models/taj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083427dc27d86765ac7f220b25da190333137cd6f9bc4592e95d92c9803353e4 +size 436436568 diff --git a/full_models/taj/config.json b/full_models/taj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/taj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/taj/vocab.txt b/full_models/taj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8fcf6eee2d513f23de056dc6e3af41d63c670ada --- /dev/null +++ b/full_models/taj/vocab.txt @@ -0,0 +1,63 @@ +| +ा +् +े +‍ +न +म +र +ल +स +ी +ि +द +ब +ह +ग +ङ +ु +य +ो +त +प +ज +थ +च +भ +श +व +क +ख +छ +इ +आ +ए +ू +ध +ै +ओ +ट +ः +फ +अ +उ +ष +घ +झ +ठ +ड +ढ +ण +ँ +ञ +ऊ +ं +ौ +' +ई +ऐ +६ +- +v +औ + diff --git a/full_models/tam/D_100000.pth b/full_models/tam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..396656b0c39250f30bbbd0447afde8c699dea925 --- /dev/null +++ b/full_models/tam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c967672f3baf02a84e5cc6a7effb98312e4f4d00f8a1a80a815962fb0f7adc9b +size 561110349 diff --git a/full_models/tam/G_100000.pth b/full_models/tam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aac18741fc32e2859b4328549ead6cca58babf12 --- /dev/null +++ b/full_models/tam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b35ba6789ab5b019d5506f4307f2a51959281df838e749038742660990bbc4 +size 436661740 diff --git a/full_models/tam/config.json b/full_models/tam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tam/vocab.txt b/full_models/tam/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..491a1a901fea2a2edefbf621223b529c2264d881 --- /dev/null +++ b/full_models/tam/vocab.txt @@ -0,0 +1,58 @@ +3 +அ +ஈ +உ +_ +ந +க + +ே +ா +ெ +ஊ +ீ +' +7 +a +ஏ +வ +் +ஹ +ூ +ல +ட +2 +ழ +ர +ம +ஒ +ற +ஞ +ச +9 +ி +ஸ +ை +ன +6 +எ +இ +ய +ௌ +த +ோ +ள +1 +ஆ +ப +0 +ண +ஓ +ங +ு +ஐ +ஜ +4 +ஷ +ொ +5 diff --git a/full_models/tao/D_100000.pth b/full_models/tao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4a3a3f33181fdc65f563a02c7fe445286aff7f65 --- /dev/null +++ b/full_models/tao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab527a1042d2d39d83c85078012c6e718a3e220707330868f3e56e07772f75c0 +size 561078961 diff --git a/full_models/tao/G_100000.pth b/full_models/tao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..69d351020e4f2a532b7b0c756133c4e6af67e19c --- /dev/null +++ b/full_models/tao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871bd3d95156c5fb345b74ba82f785fea96b055e68a838d7171c6ac4f7ae5659 +size 436354142 diff --git a/full_models/tao/config.json b/full_models/tao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tao/vocab.txt b/full_models/tao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ca084997b349d65c3702dda19cda235c25f1ea97 --- /dev/null +++ b/full_models/tao/vocab.txt @@ -0,0 +1,26 @@ +w +k +n +- +a +t +l +r +_ +p +z +o +y +g +i +' +v +s +h +c +j +m +d +b + +e diff --git a/full_models/tap/D_100000.pth b/full_models/tap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..efd22e09c3f2a303769c4c54d7d66ee314b8ab4b --- /dev/null +++ b/full_models/tap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c26e68934114fd076be740f5e3e906f0fa6559c76d4747615599ec19fd44609 +size 561078995 diff --git a/full_models/tap/G_100000.pth b/full_models/tap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a1b0e0830bbecf68c746245bf341859871abbd6b --- /dev/null +++ b/full_models/tap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c9bcd2ce2ec08a361e2644d0ecf2ba09702f21d6d3929b0f54adf766ac23a0 +size 436376973 diff --git a/full_models/tap/config.json b/full_models/tap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tap/vocab.txt b/full_models/tap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50bdadd04755245588aa5ce49881aba15b702890 --- /dev/null +++ b/full_models/tap/vocab.txt @@ -0,0 +1,36 @@ +w +g +a + +4 +z +2 +s +b +l +k +d +m +v +0 +n +7 +6 +_ +o +y +t +c +u +5 +' +h +p +3 +r +1 +e +i +9 +8 +f diff --git a/full_models/taq/D_100000.pth b/full_models/taq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d6112fa48c60be99c7c77bb93ee1ba9260e25af9 --- /dev/null +++ b/full_models/taq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deed024bca8b31df7d4d4254f4ceb03bbe527da55af60c4635fb79e9d8737317 +size 561079358 diff --git a/full_models/taq/G_100000.pth b/full_models/taq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..659028b9ff6a94f14135d54b9d611a891e371a11 --- /dev/null +++ b/full_models/taq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf5464685178f7283966ab9590b49fd6899d3122863b23c8956907a451d69591 +size 436382936 diff --git a/full_models/taq/config.json b/full_models/taq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/taq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/taq/vocab.txt b/full_models/taq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ce22c4f87ac1bc76185dd9acb62d57640825a10d --- /dev/null +++ b/full_models/taq/vocab.txt @@ -0,0 +1,38 @@ +w +t +f +ẓ +ă +q +ž +ṣ +ǝ +ĕ +j +' +k +ṭ +- +š +a +ɣ +h +l +e +c +_ +m +n +b +u +i +r +s +d +x +y +ḍ +z +o +g + diff --git a/full_models/tat/D_100000.pth b/full_models/tat/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f8fb53f3cf5170bbecef5aeb05a1e0c7a7a0183e --- /dev/null +++ b/full_models/tat/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21074fd53e25182cf6ecb066ba186ffb9d21f4ecf3be10e6bca28b8c508ab20e +size 561078597 diff --git a/full_models/tat/G_100000.pth b/full_models/tat/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b821e2244e864287226ff8508c2623499ba7490 --- /dev/null +++ b/full_models/tat/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d2ae8bb81e731b3ace866517fed116a298f8b5baf25738f83526abbcf7fb53 +size 436387887 diff --git a/full_models/tat/config.json b/full_models/tat/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tat/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tat/vocab.txt b/full_models/tat/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7719017c77b6625da0b6b32c72cff35b038cb88a --- /dev/null +++ b/full_models/tat/vocab.txt @@ -0,0 +1,43 @@ +| +а +е +ә +н +л +ы +р +к +т +и +г +м +б +д +с +у +з +ш +ч +ү +њ +й +п +ћ +μ +х +я +о +– +ђ +в +ф +э +ь +ъ +ю +- +ѳ +ж +ц +1 + diff --git a/full_models/tav/D_100000.pth b/full_models/tav/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..868dd74ebb5c7c1e614ac66d40aa8e42eb9c62a7 --- /dev/null +++ b/full_models/tav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69e3ee1476a2fa4163d81489f9e9bf25d58f5168fbadf2f523704ec8c4bd1b8 +size 561078239 diff --git a/full_models/tav/G_100000.pth b/full_models/tav/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce5b6fd03b104a6db493cfa6edb4b18bcc3e919a --- /dev/null +++ b/full_models/tav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7327e502459befd6fd0c7576dbd4c427621e345629ad0f94c071ec1664e6a2 +size 436389542 diff --git a/full_models/tav/config.json b/full_models/tav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tav/vocab.txt b/full_models/tav/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..de7b0348e31e06c20a8849f43c235667b9636580 --- /dev/null +++ b/full_models/tav/vocab.txt @@ -0,0 +1,43 @@ + +ã +é +f +n +á +— +r +g +p +õ +_ +v +z +y +s +i +a +k +q +ñ +- +ó +í +l +ʉ +h +c +m +ẽ +ĩ +e +o +j +́ +d +b +ũ +w +u +t +̃ +ú diff --git a/full_models/tbc/D_100000.pth b/full_models/tbc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb37c34ceb530e47c9ee97f4ef74982204be7cde --- /dev/null +++ b/full_models/tbc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f15d1602f1c03e46beaa00d315e34b8f06a75c767f156c7ad6d8a214fa7506 +size 561078753 diff --git a/full_models/tbc/G_100000.pth b/full_models/tbc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ee541c46bffb441dc2514bb5c1ef1f2d79848d9d --- /dev/null +++ b/full_models/tbc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:861e544e11ee2310145276b284305674bb43aab6366854e8eac29d23aeff9b64 +size 436378582 diff --git a/full_models/tbc/config.json b/full_models/tbc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tbc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tbc/vocab.txt b/full_models/tbc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..adb20975e205ddcbd8bd4e5ec23f0d7c71ede1f9 --- /dev/null +++ b/full_models/tbc/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +n +u +o +d +e +m +l +t +g +ŋ +s +k +p +r +b +y +w +f +j +h +v +0 +1 +2 +' +4 +7 +5 +3 +6 +9 +- +8 + diff --git a/full_models/tbg/D_100000.pth b/full_models/tbg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ff3fea3a7ba61fb25ffa641e4149f665fea99cf --- /dev/null +++ b/full_models/tbg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee62088f44c456cfbd8b84c81042e1168ed2ca7b27a5f47ecf99a61ad882258 +size 561078366 diff --git a/full_models/tbg/G_100000.pth b/full_models/tbg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6f5addfbc07b8261b22834a1668e8a3cc0f31890 --- /dev/null +++ b/full_models/tbg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156014d5d087837a285cd879ff6c58529d465743a90d592518b45ea0f6080bef +size 436382760 diff --git a/full_models/tbg/config.json b/full_models/tbg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tbg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tbg/vocab.txt b/full_models/tbg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2c814f1ee3fcb016dccf8b36d7f0b86534ed4b9f --- /dev/null +++ b/full_models/tbg/vocab.txt @@ -0,0 +1,40 @@ +h +k +u +3 +4 +- +y +á +6 +5 +o +t +q +v +m +˼ +— +i +g +7 +l +­ +b +d +8 +1 +r +2 +n +a +s +9 + +_ +e +f +p +j +0 +˻ diff --git a/full_models/tbk/D_100000.pth b/full_models/tbk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9fd94a976d067cc6da4bf4e2937369dc32335148 --- /dev/null +++ b/full_models/tbk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d119ddcbd59693d59ecf022919ff817942eb00fe25e989bae85a03ca4de746 +size 561076059 diff --git a/full_models/tbk/G_100000.pth b/full_models/tbk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57655e8af29de745b1d4b0ec45106e2073bef399 --- /dev/null +++ b/full_models/tbk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c876d78d60f6b38b6beb6b97b6d6383f8bd231f2ceabee94789bf1c0f405bd4 +size 436373434 diff --git a/full_models/tbk/config.json b/full_models/tbk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tbk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tbk/vocab.txt b/full_models/tbk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..41ddf9b7cbd00416e3fb3b1227794db7b1341202 --- /dev/null +++ b/full_models/tbk/vocab.txt @@ -0,0 +1,44 @@ +a +| +n +g +u +i +t +m +y +p +s +e +k +r +d +l +̱ +b +w +o +- +j +c +h +f +z +v +q +' +x +1 +̠ +̓ +ë +2 +3 +4 +5 +6 +7 +8 +9 +0 + diff --git a/full_models/tbl/D_100000.pth b/full_models/tbl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ff8bf11eec48dd87d236e4c12243b84b50f7680 --- /dev/null +++ b/full_models/tbl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ddfedc53822a36129a4e30a666c4494061454ce203e70b7d1fd9b1721f6444 +size 561078854 diff --git a/full_models/tbl/G_100000.pth b/full_models/tbl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2db0ceefdcc96a1cfd6a9cd94be4fcedd1b7ac38 --- /dev/null +++ b/full_models/tbl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d2bc5b01abe5b9c102a7f23de44006d99986942dfb6fb4355a4c46312faebc6 +size 436376506 diff --git a/full_models/tbl/config.json b/full_models/tbl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tbl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tbl/vocab.txt b/full_models/tbl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3909cbe5e37e9fc757b76dd1e55166fe22b1305a --- /dev/null +++ b/full_models/tbl/vocab.txt @@ -0,0 +1,36 @@ +ò +ó +j +- + +t +m +k +f +d +' +r +ù +s +w +g +é +ì +à +o +h +ê +e +p +b +i +y +n +è +l +a +u +6 +_ +c +ô diff --git a/full_models/tby/D_100000.pth b/full_models/tby/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..577f3726721ff87a8f50b650bb37755156f5f8af --- /dev/null +++ b/full_models/tby/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585be05e633039b173906ed5023c0678a2bfa2d339f56e5533f9bd0b3c61c05c +size 561078575 diff --git a/full_models/tby/G_100000.pth b/full_models/tby/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..669cf3fe2e7db605f881cd41c1aaf4676a91f954 --- /dev/null +++ b/full_models/tby/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d9bfa2081eb5ba8f73f3b34a2bf7963a9ddbd667a8659dd0c1b34609950df3 +size 436378158 diff --git a/full_models/tby/config.json b/full_models/tby/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tby/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tby/vocab.txt b/full_models/tby/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8eb587646502fc05489b2f341dd29d77179634d5 --- /dev/null +++ b/full_models/tby/vocab.txt @@ -0,0 +1,38 @@ +| +a +o +i +n +e +u +' +g +k +m +s +d +t +w +r +y +l +b +- +p +j +h +f +c +0 +2 +8 +z +7 +1 +4 +3 +5 +– +6 +9 + diff --git a/full_models/tbz/D_100000.pth b/full_models/tbz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7ce0902fa11762eed0de8ad61cad445ad94d58ee --- /dev/null +++ b/full_models/tbz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f76e32295c98803e723ffcd3d0e6aa14823df2950bcbeb6edeb110e0f1c0ffc +size 561078614 diff --git a/full_models/tbz/G_100000.pth b/full_models/tbz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..55e0bb296008995174536654bf116d5fd2946aa3 --- /dev/null +++ b/full_models/tbz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b9bc16d3094482bfe6d737c6c0e3c013061de6b6091fd30eada0df71d843a7 +size 436394439 diff --git a/full_models/tbz/config.json b/full_models/tbz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tbz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tbz/vocab.txt b/full_models/tbz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c7c33d71a0288ef3c9de84f02dfecc6a228b8033 --- /dev/null +++ b/full_models/tbz/vocab.txt @@ -0,0 +1,45 @@ +| +ɛ +̀ +k +n +i +ɑ +t +m +́ +d +b +ɔ +u +y +ì +o +̃ +e +í +s +p +ò +ù +r +ó +w +è +ú +c +ĩ +f +h +é +ũ +ǹ +ń +a +ṹ +ḿ +ã +á +- +v + diff --git a/full_models/tca/D_100000.pth b/full_models/tca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bb3327a89623e5dbd9dc821b993ed7fbfcda421b --- /dev/null +++ b/full_models/tca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9139319a1540d8f5178fc95b1fa7e9fadaef061990f12bc520a4257f0753ebd1 +size 561078321 diff --git a/full_models/tca/G_100000.pth b/full_models/tca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7c3ab0230059f9bafab608e591305fcb445e3584 --- /dev/null +++ b/full_models/tca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f664a36a66e07f1a71f6e6550bdc0a01f39f9dac6bff5233df6ba900d336d7 +size 436433336 diff --git a/full_models/tca/config.json b/full_models/tca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tca/vocab.txt b/full_models/tca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5dcaec022b03e25d9cb86e47d19c4b4402e826b3 --- /dev/null +++ b/full_models/tca/vocab.txt @@ -0,0 +1,62 @@ +| +a +ü +x +n +g +r +u +̃ +c +e +m +i +t +ẽ +h +y +p +ã +̱ +o +w +ĩ +d +ñ +á +í +— +́ +é +ũ +ú +õ +b +s +ó +ṯ +q +ṉ +0 +ḏ +ṍ +1 +l +7 +ḇ +ǘ +ṹ +2 +z +4 +f +- +5 +' +6 +ẖ +8 +3 +9 +k + diff --git a/full_models/tcc/D_100000.pth b/full_models/tcc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dd3a3d2055f1ced0ca888470cd4cde15e14d9687 --- /dev/null +++ b/full_models/tcc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13289373837049697cfd26ee000851a20a1c1fd88de3ff6c45c4ca62823fbf7c +size 561078858 diff --git a/full_models/tcc/G_100000.pth b/full_models/tcc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0ad8b9600cd6157d035887ee5552f2e4a791129a --- /dev/null +++ b/full_models/tcc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09df324a3ae62e6fa88dbcc2c2499ac779423130245a40bc2700a4dc248d6354 +size 436352451 diff --git a/full_models/tcc/config.json b/full_models/tcc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tcc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tcc/vocab.txt b/full_models/tcc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..78f7d26abaec833cdfe242994c94f5a2848329df --- /dev/null +++ b/full_models/tcc/vocab.txt @@ -0,0 +1,26 @@ +l +- +_ +s +h +j +' +p +k +t +o +i +u +b +n +e +m +w +c +a +g +r +f +d + +y diff --git a/full_models/tcs/D_100000.pth b/full_models/tcs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cadb46cbf342a12eb3bef8815f5bc0faf53d1a3a --- /dev/null +++ b/full_models/tcs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:583b8bab71086dd734eb84ed7a961ddf67e36a8112b9a14b7da7eaba2ee86dcb +size 561075681 diff --git a/full_models/tcs/G_100000.pth b/full_models/tcs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..28fefd7e0828d4e628af372721211ebb6c6c619c --- /dev/null +++ b/full_models/tcs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ada41412bd2f59f375ca1030219267480d748a46aaecb1f713afe2417b5f13d2 +size 436319833 diff --git a/full_models/tcs/config.json b/full_models/tcs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tcs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tcs/vocab.txt b/full_models/tcs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6cbb056bfa791ede8339eca50fde847a8eda61ff --- /dev/null +++ b/full_models/tcs/vocab.txt @@ -0,0 +1,22 @@ +| +a +i +e +n +o +m +p +d +l +b +s +t +u +k +g +w +r +z +y +' + diff --git a/full_models/tcz/D_100000.pth b/full_models/tcz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e7b5fd94e4fee75c2d608f769a648f46b2b53001 --- /dev/null +++ b/full_models/tcz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad2056109f346b14ac1365d854c2732cec0bb2ec34081a60e4739564d77f013 +size 561075824 diff --git a/full_models/tcz/G_100000.pth b/full_models/tcz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8fb18aee3e49c751a0cd9e28905495ca1182ec0d --- /dev/null +++ b/full_models/tcz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3f0ab3ab87594afe850f1bf9d285f15f9429062234af523787dfa4817a3284 +size 436369700 diff --git a/full_models/tcz/config.json b/full_models/tcz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tcz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tcz/vocab.txt b/full_models/tcz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c2b826fc2bf3ccaf1259a240bc6f32437ec9244a --- /dev/null +++ b/full_models/tcz/vocab.txt @@ -0,0 +1,43 @@ +| +a +n +i +g +h +u +t +m +k +r +w +l +e +c +s +p +â +d +o +z +v +ê +b +' +î +- +j +û +ā +ū +á +f +ē +í +é +ī +ó +ȇ +` +ō +ä + diff --git a/full_models/tdj/D_100000.pth b/full_models/tdj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..158aa9b39b447b9750fcfd6372f95e569707c535 --- /dev/null +++ b/full_models/tdj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78699340fd4a036ed777a01ac67eb4f20ae91809a2da54bddd9fb6c0629ac45d +size 561075695 diff --git a/full_models/tdj/G_100000.pth b/full_models/tdj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6fcee609667c222849ad9770554cce88dcc0c200 --- /dev/null +++ b/full_models/tdj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbb9e4dc17b1d4931bff7c63cde0007f765069ee50a4249613465add74636d2 +size 436331579 diff --git a/full_models/tdj/config.json b/full_models/tdj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tdj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tdj/vocab.txt b/full_models/tdj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b6cd955972018b27ef242cb852960f8e5d19ad23 --- /dev/null +++ b/full_models/tdj/vocab.txt @@ -0,0 +1,27 @@ +y + +i +u +t +h +o +g +j +e +r +l +m +c +w +' +p +- +_ +v +a +ꞌ +k +s +n +b +d diff --git a/full_models/ted/D_100000.pth b/full_models/ted/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..fecd656c57d1a908c4951a3f3cd78e680368d8b7 --- /dev/null +++ b/full_models/ted/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b130bcbdc8b8749fb91c4354999e882d14fdcb9b089ad1352ff4db2c7f222207 +size 561078705 diff --git a/full_models/ted/G_100000.pth b/full_models/ted/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d3df817aa33539999b0c8f1c5fbccf4c92348bc3 --- /dev/null +++ b/full_models/ted/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3bc062c75c3af4fdb10d4d79001686e95acb591871b11b20a65ead84852e3e +size 436366660 diff --git a/full_models/ted/config.json b/full_models/ted/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ted/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ted/vocab.txt b/full_models/ted/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f379d8fec2f6c306f1d0fb94fdde5ce36bd63ac3 --- /dev/null +++ b/full_models/ted/vocab.txt @@ -0,0 +1,33 @@ +| +' +n +a +ʋ +‐ +ɛ +ɔ +e +ɩ +l +y +u +i +k +b +m +o +t +h +꞊ +d +w +g +s +p +r +c +j +f +ŋ +1 + diff --git a/full_models/tee/D_100000.pth b/full_models/tee/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3cdfdb5b9bedb0f3a62e0c17b9667f3f41cb8b00 --- /dev/null +++ b/full_models/tee/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f067dbdf09852222b963ca4b1c8d4322591d47c5dc3f7955474137462096db18 +size 561078583 diff --git a/full_models/tee/G_100000.pth b/full_models/tee/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..260c205abfb110c7159a5e7f4966266454078cb7 --- /dev/null +++ b/full_models/tee/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0d83a6d5b74ff33b43f10c20636153a9be373cd195fc9914051ae02b079aea +size 436368932 diff --git a/full_models/tee/config.json b/full_models/tee/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tee/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tee/vocab.txt b/full_models/tee/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f3ecd386596e0dc816d522e20b3f891b70386988 --- /dev/null +++ b/full_models/tee/vocab.txt @@ -0,0 +1,34 @@ +ú +í +x +k +o +b +ó +e +y +m +n +h +p +á + +g +ʼ +a +t +s +z +v +i +é +c +ñ +d +f +l +u +j +_ +q +r diff --git a/full_models/tel/D_100000.pth b/full_models/tel/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88d516916358e6ea558c789f3f0e4b281f1c478b --- /dev/null +++ b/full_models/tel/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:281714bf1cc272990be6220c0643050ede21b8a74a1f32352584993e48d11392 +size 561110494 diff --git a/full_models/tel/G_100000.pth b/full_models/tel/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b189b4f37964a67053ee5d7882e6740b56dea9c5 --- /dev/null +++ b/full_models/tel/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c24d66080fc48b1d0a25c46ff0c052ec06ac6deffcec7703adb67edb10acd7 +size 436681497 diff --git a/full_models/tel/config.json b/full_models/tel/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tel/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tel/vocab.txt b/full_models/tel/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..50e4c53accd063e2b5d353ebfa5f5b0531975ebb --- /dev/null +++ b/full_models/tel/vocab.txt @@ -0,0 +1,65 @@ +త +ఞ +భ +థ +ర +న +ో +ఘ +' +ఐ +గ +ే +జ +ఔ +హ +ా +డ +మ +స + +క +ఒ +ూ +వ +ధ +శ +ౌ +ప +ః +ఠ +ఖ +ష +– +ణ +ఫ +ి +ొ +ఏ +ఎ +ృ +ఓ +య +అ +ీ +ె +_ +చ +ు +్ +ద +ల +ఉ +ఢ +- +బ +ఈ +ట +ఛ +ళ +ఊ +6 +ం +ఇ +ఆ +ై diff --git a/full_models/tem/D_100000.pth b/full_models/tem/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b80ed8cb4ddf4d1c044f749e1759b1f0e63aa89c --- /dev/null +++ b/full_models/tem/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8814bd51b22cb59558c0cd2b98aa272154d8db7fc623d01ba1de8a88c63b561 +size 561079119 diff --git a/full_models/tem/G_100000.pth b/full_models/tem/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2416ce81bb9ddb5f4cfee1ca7d0ca37044db090e --- /dev/null +++ b/full_models/tem/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c51a7d4f2a051c8d45ea7a00ee8cd3155cd95bc72048f547f819e3a32060aa2 +size 436364834 diff --git a/full_models/tem/config.json b/full_models/tem/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tem/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tem/vocab.txt b/full_models/tem/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c064ce05d4ae677bb225ace02ecab92528484ced --- /dev/null +++ b/full_models/tem/vocab.txt @@ -0,0 +1,30 @@ +| +a +k +ɔ +i +t +ŋ +m +ə +r +n +ɛ +ȧ +s +y +e +b +u +o +h +l +p +w +f +- +d +ǝ +g +c + diff --git a/full_models/teo/D_100000.pth b/full_models/teo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..80cbc9047226a5d55a43622921c470b12dd93416 --- /dev/null +++ b/full_models/teo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfd1b87ba3eaf8be7a3074ca4c44dff0c82d3943cf54abd8f29a4111d32a0aa +size 561079015 diff --git a/full_models/teo/G_100000.pth b/full_models/teo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b402c4fb7908fff48a6bad55ce83dc8afbbca304 --- /dev/null +++ b/full_models/teo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7428e27309185e85b4fc1ff1c34fbb1f1485dbca8412a5fe48ef50918168be +size 436355399 diff --git a/full_models/teo/config.json b/full_models/teo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/teo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/teo/vocab.txt b/full_models/teo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..043fe2d09473d37a114d759cab18bfca0f64720e --- /dev/null +++ b/full_models/teo/vocab.txt @@ -0,0 +1,27 @@ +a +| +i +k +e +o +n +t +u +r +s +l +m +d +y +p +ŋ +b +j +w +c +g +' +- +— +– + diff --git a/full_models/ter/D_100000.pth b/full_models/ter/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d86eec417ff359813995bdf59f5eda520403e8a3 --- /dev/null +++ b/full_models/ter/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92bc67acb6271e43e9fe26ba363b45f82acd47991348f82c8aeeb1eb98f2bc7 +size 561078721 diff --git a/full_models/ter/G_100000.pth b/full_models/ter/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1e0422b888ad15f1950e1acd2dbd3f77182529c1 --- /dev/null +++ b/full_models/ter/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9bf2ebfa6dcb44dc3d6fccd3de2c8c2099f00cd69e55faaed350d1e00d2d63 +size 436380460 diff --git a/full_models/ter/config.json b/full_models/ter/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ter/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ter/vocab.txt b/full_models/ter/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3e05a3e777e2d29fce9607a98691de4811c46c35 --- /dev/null +++ b/full_models/ter/vocab.txt @@ -0,0 +1,39 @@ +| +o +k +e +i +n +a +t +u +p +v +h +y +x +ó +' +m +á +í +ú +s +é +â +r +ê +j +û +d +ô +l +g +— +‍ +z +b +î +f +- + diff --git a/full_models/tes/D_100000.pth b/full_models/tes/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a2ca4a824a1690b1ce1f85124dc4a2bfceb952f4 --- /dev/null +++ b/full_models/tes/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e8268de6581b00b654f61d5719debc2a9eff3b2de7a98eeb4b616ad0a1550d +size 561076026 diff --git a/full_models/tes/G_100000.pth b/full_models/tes/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bc2b432f2691194cff5f466fed22b0e8f848319b --- /dev/null +++ b/full_models/tes/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e8d3e5c1ab4bd5321dc0d9fcc4d3baa6e3e5b82588777c7807e9729b1576d2 +size 436331348 diff --git a/full_models/tes/config.json b/full_models/tes/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tes/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tes/vocab.txt b/full_models/tes/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..11537f40e18c9e7debb6876f857a11fefd3caba7 --- /dev/null +++ b/full_models/tes/vocab.txt @@ -0,0 +1,26 @@ +k +f +a +s +l +r +p +t +- +' +h +j +g +m +c +u +b +_ +n +o +d +y + +i +w +e diff --git a/full_models/tew/D_100000.pth b/full_models/tew/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..af594ac7cd0e0d6a003c5944c2aa3ed431cdd17d --- /dev/null +++ b/full_models/tew/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5214b5063b2aeff9aa7931017e6dab189dfcf97666aff79c5142fbcc2d210e97 +size 561076199 diff --git a/full_models/tew/G_100000.pth b/full_models/tew/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d207fbf8b90ce4f612958ecbaf604223c40c72c7 --- /dev/null +++ b/full_models/tew/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:484e361d59b26b0a4574b8cb7ca60c460f59bd37edcc342480b5d1598d4ec0a7 +size 436383557 diff --git a/full_models/tew/config.json b/full_models/tew/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tew/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tew/vocab.txt b/full_models/tew/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..570b4bcb10cbe8253185a0de37024a7ae975ab37 --- /dev/null +++ b/full_models/tew/vocab.txt @@ -0,0 +1,48 @@ +n +ä +i +ú +é +̂ +z +- +f +k +s +ô +c +ḏ +_ +y +á +î +r +t +o +û +ˀ +g +í +̖ +e +w +v +b +p +́ +j +— +' +d +h +x +ꞌ +ê +q +a +m +l +â + +u +ó diff --git a/full_models/tex/D_100000.pth b/full_models/tex/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b959b080fc6f783a60cee895bf7f97e8b7f4d1be --- /dev/null +++ b/full_models/tex/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8fab4dcb74ef94815a1bc0cddee2283115076d61e4bea6adb3d560fedf696f +size 561078752 diff --git a/full_models/tex/G_100000.pth b/full_models/tex/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c969f5262e20da2afd3b7564c86568b668aa9f00 --- /dev/null +++ b/full_models/tex/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca11783766d433d3a5e320e7d48ac2e6129cdd80f421ef9079b691002ac744c5 +size 436366391 diff --git a/full_models/tex/config.json b/full_models/tex/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tex/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tex/vocab.txt b/full_models/tex/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..43e5de644c55f47dc4309a35f236894a381b6803 --- /dev/null +++ b/full_models/tex/vocab.txt @@ -0,0 +1,32 @@ +r +a +i +e +c +í +s +k +- +t +o +d +̱ +y +j +h +u +_ +l +w + +m +p +n +g +z +ṯ +á +' +ó +b +v diff --git a/full_models/tfr/D_100000.pth b/full_models/tfr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b51f40b56989612618a95541c1114328e66cb182 --- /dev/null +++ b/full_models/tfr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d96100adc4497ac694b5fc79de3ffd7ffdde63cd259671bf9746224d6036344 +size 561078609 diff --git a/full_models/tfr/G_100000.pth b/full_models/tfr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..97b95aecb21e906e68d4101c194eb80773fb420d --- /dev/null +++ b/full_models/tfr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca797c23152306d8860e80e1be68de88dbbde28739263c74bcdf2caf9b603f77 +size 436410423 diff --git a/full_models/tfr/config.json b/full_models/tfr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tfr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tfr/vocab.txt b/full_models/tfr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..646d4f7d43b7ed7943899e6815177a0a04488090 --- /dev/null +++ b/full_models/tfr/vocab.txt @@ -0,0 +1,52 @@ +| +o +a +k +g +j +e +š +n +r +s +i +b +ë +y +w +t +h +p +d +m +ö +ð +u +ä +î +õ +ã +ú +ê +c +z +l +í +é +û +f +ó +á +v +q +ò +ø +è +x +' +à +þ +ü +ï +ñ + diff --git a/full_models/tgj/D_100000.pth b/full_models/tgj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2899c3c40aa289f2c328dedfab60c0a242c65fce --- /dev/null +++ b/full_models/tgj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31fc8a6cc1e1c06207c46b13f14c357189c1d8d0c3de13e55425bf03b07ec459 +size 561079264 diff --git a/full_models/tgj/G_100000.pth b/full_models/tgj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f2749d5aefd08dd6037af6a7c099e9a39d2ad388 --- /dev/null +++ b/full_models/tgj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d6dc812e1bffbb4963f6288878b02fca363e0865c0be6772348997cb8ae6ce +size 436375631 diff --git a/full_models/tgj/config.json b/full_models/tgj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tgj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tgj/vocab.txt b/full_models/tgj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d5011e179139e2741e463f541fe13d3e013cf010 --- /dev/null +++ b/full_models/tgj/vocab.txt @@ -0,0 +1,34 @@ +| +v +n +a +o +g +u +i +k +m +l +r +b +d +w +y +t +s +p +h +j +e +c +— +- +' +0 +4 +6 +1 +f +z +2 + diff --git a/full_models/tgk/D_100000.pth b/full_models/tgk/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e72247c99c6b259d9ec16e7f17b324acf11072d --- /dev/null +++ b/full_models/tgk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d667c577e03adda4ee873a9381b1b21600e2292720355738ecea61d683d2228 +size 561078884 diff --git a/full_models/tgk/G_100000.pth b/full_models/tgk/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..8078ee1a73b29ee3fbf85bda5e28da8daaaac4d0 --- /dev/null +++ b/full_models/tgk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae60843269e0c6067be39ee2984974ae7c6709c5419dd7b06bdd3d5ae2847a4d +size 436389820 diff --git a/full_models/tgk/config.json b/full_models/tgk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tgk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tgk/vocab.txt b/full_models/tgk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4e5c36d7373bf633d13a47b8f959171cde4683a3 --- /dev/null +++ b/full_models/tgk/vocab.txt @@ -0,0 +1,41 @@ +о +ҷ +б +к +я +т + +у +ҳ +ӯ +ч +е +ю +ц +з +м +в +п +ь +— +ф +ш +г +_ +ӣ +ж +э +ё +й +ғ +а +ъ +‐ +р +с +д +и +л +х +қ +н diff --git a/full_models/tgl/D_100000.pth b/full_models/tgl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..de0eba7081550e2f4883564a2c48a4f3b4070d02 --- /dev/null +++ b/full_models/tgl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d175a59f5de54174c8ec8e7bf1c81f8be3743c7674f9975e81e30a7d7242407 +size 561110147 diff --git a/full_models/tgl/G_100000.pth b/full_models/tgl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3146771d41160d889411b95ec4413f5c2b405ba4 --- /dev/null +++ b/full_models/tgl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7407f398d547b85c30f978e63d82a057883e7533162b21839a25acdcff27f8 +size 436630062 diff --git a/full_models/tgl/config.json b/full_models/tgl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tgl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tgl/vocab.txt b/full_models/tgl/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..731564886683fd535ce9f208a25aa2df50193259 --- /dev/null +++ b/full_models/tgl/vocab.txt @@ -0,0 +1,43 @@ +a +ʼ +x +g +- +o +m +s +i +u +5 +e +0 +z +v +6 +n +' +– +y +2 +f +c +p +r + +j +q +t +9 +b +d +1 +h +w +_ +l +3 +7 +8 +ñ +k +4 diff --git a/full_models/tgo/D_100000.pth b/full_models/tgo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bc2237bdcea8804812a03be5228a59e8b6b3e380 --- /dev/null +++ b/full_models/tgo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4cd1f6701f234110d7feb9a2f0fd2e255dc1f7a18808c021bf352000b9aecce +size 561078623 diff --git a/full_models/tgo/G_100000.pth b/full_models/tgo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5f7c9861644a66088c573a293449d560a109ca6b --- /dev/null +++ b/full_models/tgo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051e0f7a2f6c4205b5d3f3e596a89f960a3931b211ce5a273c82755f8b2e3132 +size 436366763 diff --git a/full_models/tgo/config.json b/full_models/tgo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tgo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tgo/vocab.txt b/full_models/tgo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..13df9bd4c73bfbe016b0d67fe602e93b8b110590 --- /dev/null +++ b/full_models/tgo/vocab.txt @@ -0,0 +1,33 @@ +_ +' +— +b +y +w +2 +f +j +v +6 +1 +- +o +a +ɨ +r +h +ŋ +i +d +m +g +p +l +t +k + +n +0 +e +u +s diff --git a/full_models/tgp/D_100000.pth b/full_models/tgp/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..a46bbc00011bfc7cc83222c4e94d9185c23142e2 --- /dev/null +++ b/full_models/tgp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217bc41c1b447938ba3fc74619361c82f746901ae05888e7e324b3a07afcb686 +size 561078205 diff --git a/full_models/tgp/G_100000.pth b/full_models/tgp/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..29dbd823ca50da1b6b47402bd4cd0e0940685513 --- /dev/null +++ b/full_models/tgp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd6763870dc65c3124a073604692ba7bbf9fe7d75a60c6488e85369a4706b16 +size 436389595 diff --git a/full_models/tgp/config.json b/full_models/tgp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tgp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tgp/vocab.txt b/full_models/tgp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0483fa1bae692b468d1bd8dd7df7edfd20ead307 --- /dev/null +++ b/full_models/tgp/vocab.txt @@ -0,0 +1,43 @@ +| +a +i +o +n +e +r +m +l +t +u +h +s +v +p +̃ +k +g +j +d +b +c +w +1 +y +2 +z +' +4 +3 +6 +f +0 +5 +9 +8 +7 +x +– +— +q +- + diff --git a/full_models/tha/D_100000.pth b/full_models/tha/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..a0dcb722151e5c9e8cbbaaa147608029807ec82d --- /dev/null +++ b/full_models/tha/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb1ec39007f49fd2dfd902b9a784ea87aa6b13bc8ede75d29babecac6bbc82b +size 561079135 diff --git a/full_models/tha/G_100000.pth b/full_models/tha/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..41344b27257b1cfe2ae98771baf7f7bab4bcdeaa --- /dev/null +++ b/full_models/tha/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df7230675689c30a3b00fc2313714539774da4ab4a613b99a03a2e54b4e4e5e9 +size 436459620 diff --git a/full_models/tha/config.json b/full_models/tha/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tha/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tha/vocab.txt b/full_models/tha/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..11de8465ce535569b832e707dd7174fc16795d4e --- /dev/null +++ b/full_models/tha/vocab.txt @@ -0,0 +1,71 @@ +า +น +่ +ร +เ +้ +อ +ง +ก +ว +ะ +ั +ม +ท +พ +ย +ล +จ +ี +ค +ต +ด +ห +ข +ิ +แ +ส +บ +ป +ไ +ู +ใ +็ +ื +์ +ช +ุ +ึ +ํ +โ +ผ +ถ +ญ +ซ +ธ +ศ +ณ +ษ +ฟ +ภ +ฉ +ฝ +ฐ +ฤ +ฏ +ฮ +ฆ +๋ +ฎ +' +0 +๊ +ฑ +1 +4 +2 +- +ฬ +ฒ +ฌ + diff --git a/full_models/thk/D_100000.pth b/full_models/thk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..856f1d9a2aaf9276025782dec0b8399e8c219a3b --- /dev/null +++ b/full_models/thk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62729db36acabb5ffddd4edc07903f223d9fd325718f23bae348220b81d0e1bf +size 561078614 diff --git a/full_models/thk/G_100000.pth b/full_models/thk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f021f3596bc88ccad474f96cfb5e1d70c4107b75 --- /dev/null +++ b/full_models/thk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af4e5031920e1987e41d5aa26b8062e90075285f942631790c9ef716fa4ddedc +size 436355793 diff --git a/full_models/thk/config.json b/full_models/thk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/thk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/thk/vocab.txt b/full_models/thk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b1a41cd543f4e09df9e7dce741ca0a292c775ab5 --- /dev/null +++ b/full_models/thk/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +û +î +r +i +t +e +k +g +b +m +w +u +o +h +y +d +s +' +c +j +p +- +f +l + diff --git a/full_models/thl/D_100000.pth b/full_models/thl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..69e8a74cb3a8b9fcd0f4b7b6c3be35ff4e58a42c --- /dev/null +++ b/full_models/thl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9543e978b80259195d5484666febc4bdbbd48eb3676d2123fc01e41ae47178df +size 561079239 diff --git a/full_models/thl/G_100000.pth b/full_models/thl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ee4e7b021d8e9bb2501ff2e9a67027120e07ccb --- /dev/null +++ b/full_models/thl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8eb125cf4d10fa9c7a9f2fda8172c8d7cf0bcc39aadc2062d0a3d489f0d2d5 +size 436442644 diff --git a/full_models/thl/config.json b/full_models/thl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/thl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/thl/vocab.txt b/full_models/thl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c697a84cf52e2b73fdf3019e41f664009eba19e7 --- /dev/null +++ b/full_models/thl/vocab.txt @@ -0,0 +1,64 @@ +ृ +क +ड +ऊ +इ +् +ल +ठ +ो +ङ +ञ +व +ि +ऐ +ओ +झ +ँ +ढ +ः +छ +ऋ +ू +ब + +ौ +प +' +ध +ु +ण +थ +र +श +ष +_ +े +फ +ख +ई +त +ऽ +आ +‍ +स +ज +द +उ +म +- +य +ी +ग +ा +घ +ए +औ +ट +भ +ै +ह +अ +न +च +ं diff --git a/full_models/tih/D_100000.pth b/full_models/tih/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ff39d48fe97aa5d95026fd7f780ba99ffbfb650b --- /dev/null +++ b/full_models/tih/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd59f050bada827fd234289436344a618653c4cdf4b7a689ff69c1e4a8ca2976 +size 561078978 diff --git a/full_models/tih/G_100000.pth b/full_models/tih/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..41605ee183040dc89abafbc3d88c5a87b41a3167 --- /dev/null +++ b/full_models/tih/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b68f10bd44b5d867c8d4c3442be7f705759e250f63da502721da17a709321c0 +size 436367169 diff --git a/full_models/tih/config.json b/full_models/tih/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tih/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tih/vocab.txt b/full_models/tih/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e4cd10cfd441b2fc0cfb0189dad29603835b76f2 --- /dev/null +++ b/full_models/tih/vocab.txt @@ -0,0 +1,32 @@ +t +u +4 +o +m +r +e +z +l +d +w +y +j +b +a +– +g +_ +n +p +s +k +- +i + +h +' +0 +1 +6 +c +2 diff --git a/full_models/tik/D_100000.pth b/full_models/tik/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f27b24ed9bdd515b9bd166141f81ff9d389d2d49 --- /dev/null +++ b/full_models/tik/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2442492fbe24ad697749158b0c7ea6e2de58ba8802fee951133c177b0be953d6 +size 561078624 diff --git a/full_models/tik/G_100000.pth b/full_models/tik/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c0799e761195a2bb618dd8fd4d10fdc10b4714cf --- /dev/null +++ b/full_models/tik/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05a78559eed0a4b1d28012f7f37875b3ee5c5827c1f20ac4d703cc28535671f1 +size 436412854 diff --git a/full_models/tik/config.json b/full_models/tik/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tik/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tik/vocab.txt b/full_models/tik/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..384818bfeba2aaa938c8826f8b73a4d826003149 --- /dev/null +++ b/full_models/tik/vocab.txt @@ -0,0 +1,53 @@ +| +n +ɛ +i +m +w +y +ɓ +̀ +l +k +s +ʼ +u +a +ì +e +t +à +b +æ +ù +ɔ +o +h +z +c +f +̌ +ǹ +d +ɗ +ŋ +v +ò +g +p +ǎ +è +j +̂ +r +â +- +ǐ +î +ê +ǔ +û +ě +ǒ +ô + diff --git a/full_models/tir/D_100000.pth b/full_models/tir/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9902f7a172c0dfcd50cef7b7b81c2e128a3a163a --- /dev/null +++ b/full_models/tir/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c654c87911d1b5e796c8320f934e5362c6f8cbac1333350327012b79b86b1791 +size 561078581 diff --git a/full_models/tir/G_100000.pth b/full_models/tir/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f7ab51d714061bebe7de25ad3c19e0354e0f90a --- /dev/null +++ b/full_models/tir/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8db9de59b6e0f6efd87e25c6da7e381268d05b4f71b1f57ee2374236c135fa5 +size 436353053 diff --git a/full_models/tir/config.json b/full_models/tir/config.json new file mode 100644 index 0000000000000000000000000000000000000000..993d1dedb1d0c8e820b98f9e2f019ff166327038 --- /dev/null +++ b/full_models/tir/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.uroman", + "validation_files": "dev.uroman", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tir/vocab.txt b/full_models/tir/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..29be0f20b63dddfab221c774186a4475ac3cd7f1 --- /dev/null +++ b/full_models/tir/vocab.txt @@ -0,0 +1,27 @@ + +- +a +b +c +d +e +f +g +h +i +j +k +l +m +n +o +p +q +r +s +t +u +w +x +y +z diff --git a/full_models/tkr/D_100000.pth b/full_models/tkr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..74094b2170afba6cff1f201388677626ca188637 --- /dev/null +++ b/full_models/tkr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed467d749881267f299c80b4c7428ea85c47da2c9c2a90481d58c1e8e87ed6fc +size 561076072 diff --git a/full_models/tkr/G_100000.pth b/full_models/tkr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..247bb0b0f485d4da62aee312721676ec356b44cc --- /dev/null +++ b/full_models/tkr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d804197675f34cf99a1569ab5c6fca338e3f223755637d92f16f1b68344304be +size 436357289 diff --git a/full_models/tkr/config.json b/full_models/tkr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tkr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tkr/vocab.txt b/full_models/tkr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c0675d44f367dbc172e76a71389e6c33569d56a2 --- /dev/null +++ b/full_models/tkr/vocab.txt @@ -0,0 +1,37 @@ +| +a +e +n +' +i +ı +y +l +h +s +u +m +k +q +b +r +g +x +ş +d +v +ə +o +t +ç +c +ğ +p +z +– +ü +ö +- +̇ +f + diff --git a/full_models/tlb/D_100000.pth b/full_models/tlb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..22cde23f42538a8dbdaef3dcf74972ec7403280c --- /dev/null +++ b/full_models/tlb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48974137e5faf32456074fadabf7cb859c0d60ea927dfb675c7ccc90563d2f3b +size 561078887 diff --git a/full_models/tlb/G_100000.pth b/full_models/tlb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7fad2875221a9be80db02c237690c6c9da8aa142 --- /dev/null +++ b/full_models/tlb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70fe322dae94c85e194c8c2d4ece8017df86f4ffe43baa485345ab181469c316 +size 436391504 diff --git a/full_models/tlb/config.json b/full_models/tlb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tlb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tlb/vocab.txt b/full_models/tlb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..2664f396df63357419094413b2befdd284cbe22b --- /dev/null +++ b/full_models/tlb/vocab.txt @@ -0,0 +1,43 @@ +g +- +5 +y +z +a +l +ö +2 +w +n +_ +u +ï +ë +c +o + +d +e +i +6 +m +ü +9 +0 +̄ +v +f +ä +b +p +7 +1 +4 +r +s +3 +j +h +t +' +k diff --git a/full_models/tlj/D_100000.pth b/full_models/tlj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6db5d7149a46b748c5585127a3e8019af795c305 --- /dev/null +++ b/full_models/tlj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beaa4fdf0ae5b30e8fcea1969be527f0e61e9f908af8c45544559089d544ff85 +size 561079000 diff --git a/full_models/tlj/G_100000.pth b/full_models/tlj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d48b4fcb44d87f03c5ca2812e580e81ce01afc0d --- /dev/null +++ b/full_models/tlj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d9a126dfe504fe5e54742b3573658ed6329dac3a610eebbb74f3162fa5c3bc +size 436362055 diff --git a/full_models/tlj/config.json b/full_models/tlj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tlj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tlj/vocab.txt b/full_models/tlj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..85f0fceaa7221e45708b78818c2d55f32ff6a2c0 --- /dev/null +++ b/full_models/tlj/vocab.txt @@ -0,0 +1,30 @@ +y +c +w +d + +n +s +- +̱ +k +ʼ +j +_ +a +l +o +t +f +5 +m +' +b +i +h +g +u +p +v +e +6 diff --git a/full_models/tly/D_100000.pth b/full_models/tly/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2f434b0a4d9d911a6af3a273665973e2313663b8 --- /dev/null +++ b/full_models/tly/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236f46c9b209f7c92ec46d82beb025cacf7ff05d56ab425eaac462858b524d36 +size 561078995 diff --git a/full_models/tly/G_100000.pth b/full_models/tly/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a55e3f211b6b613cae52c5ca9eb43eb0101c481 --- /dev/null +++ b/full_models/tly/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ff6c11c4eefdf28a0f5efbaf00092e8766952f111f5ac674f6fb4d20cf8930 +size 436386787 diff --git a/full_models/tly/config.json b/full_models/tly/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tly/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tly/vocab.txt b/full_models/tly/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..004e24359715b1dbc255c6eb7d4ea65137b89b0f --- /dev/null +++ b/full_models/tly/vocab.txt @@ -0,0 +1,40 @@ +t +x +a +ğ +m +0 +i +5 +s +q +h +ə +r +v +p + +4 +d +n +y +– +c +z +ş +- +k +_ +b +o +u +e +l +1 +f +6 +2 +j +ı +ç +̇ diff --git a/full_models/tmc/D_100000.pth b/full_models/tmc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d5dfabe30ce0baae5f5d33f4ae2032650adba6d9 --- /dev/null +++ b/full_models/tmc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a37517fbbac3bf2454c27a2fd7a30edd49790897bfaf73b4bfd81310340669f6 +size 561078748 diff --git a/full_models/tmc/G_100000.pth b/full_models/tmc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed22be74cfaf2c8ad27b1928ede4c568384c90cc --- /dev/null +++ b/full_models/tmc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be7ca67b244f36593f14f39229d19cdd4714dbc1b775649c97d0886b155d4c86 +size 436371382 diff --git a/full_models/tmc/config.json b/full_models/tmc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tmc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tmc/vocab.txt b/full_models/tmc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a95dc2c85348fb2336fdfea7ed4b2c7567b87ffc --- /dev/null +++ b/full_models/tmc/vocab.txt @@ -0,0 +1,34 @@ +n +l +b +o +i +y +ɔ +u +ɨ +- +ɛ +꞊ +ɓ +r +_ + +a +́ +ɗ +t +h +k +j +m +̰ +e +ᵻ +g +' +ḭ +w +d +s +p diff --git a/full_models/tmf/D_100000.pth b/full_models/tmf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ef55ef86c26d9dac1b8d8289bec78b448b63ae5 --- /dev/null +++ b/full_models/tmf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:658c4a8d20aacbf58eb4fcf3356961fba1c071c9cf281fed6263b1da51083764 +size 561077828 diff --git a/full_models/tmf/G_100000.pth b/full_models/tmf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8abb34153b310c2810527300aa2b243a0ac34688 --- /dev/null +++ b/full_models/tmf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcbd9232df76d5d0958de975a55e4d936f36e90df4a263f9dd7ff68378289da6 +size 436373635 diff --git a/full_models/tmf/config.json b/full_models/tmf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tmf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tmf/vocab.txt b/full_models/tmf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..44be349851069370094f7baa021517c5fe8a0346 --- /dev/null +++ b/full_models/tmf/vocab.txt @@ -0,0 +1,40 @@ +a +| +k +e +n +m +l +h +o +t +p +i +s +' +g +v +q +r +u +j +— +c +d +b +f +y +0 +1 +z +2 +7 +4 +5 +x +3 +6 +9 +8 +ñ + diff --git a/full_models/tna/D_100000.pth b/full_models/tna/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7d9d24e8fca82efb4dfe7570f8fa56546d15b120 --- /dev/null +++ b/full_models/tna/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7012f1872cc60a7248250b9f047ada7475563265a0f09bf97b4ce14bc0d4eebe +size 561078849 diff --git a/full_models/tna/G_100000.pth b/full_models/tna/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..403f26e853a5d7bc0f5ed9fb15812e53ace1efd9 --- /dev/null +++ b/full_models/tna/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c072222c05bc02a28b9171bc9126712a89e444628cf34aaf50993c636ab1989 +size 436377652 diff --git a/full_models/tna/config.json b/full_models/tna/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tna/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tna/vocab.txt b/full_models/tna/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6b70329240912e7345c020dea6e469922ad7362b --- /dev/null +++ b/full_models/tna/vocab.txt @@ -0,0 +1,37 @@ +i +h +o +g +m +p +— +z +' +r +s +e +f +y +d +x +ñ + +í +n +k +t +q +_ +u +j +l +á +ó +0 +8 +v +a +b +ú +é +c diff --git a/full_models/tng/D_100000.pth b/full_models/tng/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2632aaf9d26b4ff1005751b3e93e2d5e05cc97dd --- /dev/null +++ b/full_models/tng/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf0c5e6eb6b3d90affd53eb5f2ff2bc949f766de192465a60e9772b50eed09a +size 561079263 diff --git a/full_models/tng/G_100000.pth b/full_models/tng/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a463a8b0f4bafc8f1d2e18473324e632a6615400 --- /dev/null +++ b/full_models/tng/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1e785773417cd95e57d7ea628a0c3d4ffafaa5e415deae6b29e08ac322f411 +size 436378003 diff --git a/full_models/tng/config.json b/full_models/tng/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tng/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tng/vocab.txt b/full_models/tng/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ce58e201459d31b60f2df5703d0c6b5e2e0cf0f9 --- /dev/null +++ b/full_models/tng/vocab.txt @@ -0,0 +1,36 @@ +u +b +h +û +î +r +a +n +j +s +ÿ +v +g +y +â +ç +c +ô +m +o +ë + +- +_ +ê +d +ū +e +k +é +w +l +i +' +p +t diff --git a/full_models/tnk/D_100000.pth b/full_models/tnk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..61da4920153be04e7eca71ed89e3574a19aa4a5c --- /dev/null +++ b/full_models/tnk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52bd936780c3508f42f3597adf2445dbf4c657a502af203346a849cf990ce833 +size 561078715 diff --git a/full_models/tnk/G_100000.pth b/full_models/tnk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2a1543bf1d9e73d5863da0052b9bb2382135a4d1 --- /dev/null +++ b/full_models/tnk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14eab2fe8ee42ffc81d8f6ca5fafbe58baa8dbf4f0dfbdbc7f98100135dc0c98 +size 436366681 diff --git a/full_models/tnk/config.json b/full_models/tnk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tnk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tnk/vocab.txt b/full_models/tnk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b95e65f6f3e1c2cdbea160fead19eb6175bf2d18 --- /dev/null +++ b/full_models/tnk/vocab.txt @@ -0,0 +1,33 @@ +0 +d +n +b +s +r +w +ə +u +a +k +ɨ +ɡ +v +y +l + +m +' +4 +t +3 +_ +j +ǝ +- +e +h +o +f +i +p +g diff --git a/full_models/tnn/D_100000.pth b/full_models/tnn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0a0289fac99a4a06743970d51ea78cc087063997 --- /dev/null +++ b/full_models/tnn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f40ee0ff5ee91d53aeef9f32a193a7ff8173deb807eb973c3853df5e4fd594 +size 561078706 diff --git a/full_models/tnn/G_100000.pth b/full_models/tnn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fd232345f4d4420f11ae4edc865ce12de41f8f0c --- /dev/null +++ b/full_models/tnn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac08b165b7b984d88b4971b4b38bd25b1ea76fc80ea7418285426df7c6e95346 +size 436353081 diff --git a/full_models/tnn/config.json b/full_models/tnn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tnn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tnn/vocab.txt b/full_models/tnn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e27839c59d6c19f57e4bc4843f840e00d3413afa --- /dev/null +++ b/full_models/tnn/vocab.txt @@ -0,0 +1,27 @@ +ə +l +h +v +_ +s +m +o +n +g +i +ɨ +' +b +r +- +e +k +a +t +f +u +w +j + +d +p diff --git a/full_models/tnp/D_100000.pth b/full_models/tnp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..49bbb76a65c1d99c537ecd8fbe2e0f3a063606f0 --- /dev/null +++ b/full_models/tnp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353eccbd5a4d7d1c48f1101ef94c16a97ed9f8e98edf6fc0ca334027a0e2210f +size 561076030 diff --git a/full_models/tnp/G_100000.pth b/full_models/tnp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c71946df280cc59209e520732564bac264d9f149 --- /dev/null +++ b/full_models/tnp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d3585cdd76281865b5c2c26e4d2450d0af84324da1843bece6c6eced0113a4 +size 436336049 diff --git a/full_models/tnp/config.json b/full_models/tnp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tnp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tnp/vocab.txt b/full_models/tnp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..02a738b60803652e472ff0c200437b5afaa45473 --- /dev/null +++ b/full_models/tnp/vocab.txt @@ -0,0 +1,28 @@ +_ +o +d +n +ə +u +e +h +m +r +g +f +ɨ +t +i +b +v +k +s +' +l + +w +a +— +- +j +p diff --git a/full_models/tnr/D_100000.pth b/full_models/tnr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..80676ca5a3ce980a0e48f312fbb7d2dbb64fa517 --- /dev/null +++ b/full_models/tnr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631169d6681b7115cfe842342da4ba0f97333262fb90cc41aa4046fad72d1cad +size 561078503 diff --git a/full_models/tnr/G_100000.pth b/full_models/tnr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a46bc3e694f28cb23e663912ce8c88e884672a8f --- /dev/null +++ b/full_models/tnr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee97ed6bf65526b87e7efbc50478bc5d71483067150b67daa166efb084a8e886 +size 436375860 diff --git a/full_models/tnr/config.json b/full_models/tnr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tnr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tnr/vocab.txt b/full_models/tnr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d514728e50e1d5158b9c7c8301be411bdf63f79e --- /dev/null +++ b/full_models/tnr/vocab.txt @@ -0,0 +1,37 @@ +ó +h +j +_ +t +a +u +n +é +c +i +ŝ +ü +r +p +m +d +ƴ +s +ñ +g +ë +e +k +– +y +ɓ +o + +f +ɗ +— +ŋ +b +w +- +l diff --git a/full_models/tnt/D_100000.pth b/full_models/tnt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6f13561562ecc97272c6e4c3768ba796c864f8ee --- /dev/null +++ b/full_models/tnt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92f65e597353ff896244b08e753e41b9af6e562e912f310c7d732971b69d8d72 +size 561078877 diff --git a/full_models/tnt/G_100000.pth b/full_models/tnt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f3a0182329fbbaa588a25b501c7110c9641c4d12 --- /dev/null +++ b/full_models/tnt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1338d2a03d031ef9da96e847f8c88440bf3b016927c354a3ed67951024e942e3 +size 436360917 diff --git a/full_models/tnt/config.json b/full_models/tnt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tnt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tnt/vocab.txt b/full_models/tnt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7777019f4d72db119a50746854bb00a22ca33844 --- /dev/null +++ b/full_models/tnt/vocab.txt @@ -0,0 +1,29 @@ +' +y +z +w +u +j +t +d +i +f +h +m + +é +_ +p +r +n +k +- +e +c +a +b +o +l +ó +g +s diff --git a/full_models/tob/D_100000.pth b/full_models/tob/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0f1c52b204ca37e6c4d4ef39477988590a15b948 --- /dev/null +++ b/full_models/tob/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc5f62ea50a8f0828a6289b791daad3e7b0f3db21093b2b183f34f7c1a3b2ef +size 561078247 diff --git a/full_models/tob/G_100000.pth b/full_models/tob/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a9b2bc14c6f4c76584cb803c7d70f2adec08c919 --- /dev/null +++ b/full_models/tob/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9cb8c7a5984703cfaf39a2da1892efe760ddd49b692029a09f01c347120115 +size 436375843 diff --git a/full_models/tob/config.json b/full_models/tob/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tob/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tob/vocab.txt b/full_models/tob/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..43bbd52aef1d159703320a4505f897cd84625435 --- /dev/null +++ b/full_models/tob/vocab.txt @@ -0,0 +1,37 @@ +m +y +s +' +r +q +j +f +_ +i +a +c +k + +b +ú +á +h +t +í +e +o +x +ó +ñ +p +d +– +l +n +z +v +ỹ +é +g +u +- diff --git a/full_models/toc/D_100000.pth b/full_models/toc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..313beb920f34b07521370c864f5528c434287e05 --- /dev/null +++ b/full_models/toc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e14b0ab2a4384ed0f831c5c6380a07864eeb5d53b7d661a1ce58d06587d815 +size 561076169 diff --git a/full_models/toc/G_100000.pth b/full_models/toc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..88ba1f22fd0e7a3e2195a67b87add8f554fc0aed --- /dev/null +++ b/full_models/toc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6515fbf14e5d20f9c1656cabafae01901bb4f83a693e14911bbe43880beb9b +size 436357937 diff --git a/full_models/toc/config.json b/full_models/toc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/toc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/toc/vocab.txt b/full_models/toc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bef210f33cc390784f17ae49d1aec2dbf6b6ad01 --- /dev/null +++ b/full_models/toc/vocab.txt @@ -0,0 +1,37 @@ +a +| +̲ +n +u +i +t +c +l +h +á +x +m +p +s +k +y +o +q +e +r +í +ú +j +z +d +é +b +— +g +ó +f +v +' +ñ +w + diff --git a/full_models/toh/D_100000.pth b/full_models/toh/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dcf180d4fcc5554808216cf7b7484e112df31a7f --- /dev/null +++ b/full_models/toh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71749685c6069918e952137bbd6a2a673a65572d65b3a0f38fa52b796e71679 +size 561079109 diff --git a/full_models/toh/G_100000.pth b/full_models/toh/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..457b7789e4e03b4fd22395f78572909fe9187fa1 --- /dev/null +++ b/full_models/toh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15cd720c2afd0d0696082a6eb0e7ff50c324950f6d38c5c6aea329e60f556e28 +size 436367907 diff --git a/full_models/toh/config.json b/full_models/toh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/toh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/toh/vocab.txt b/full_models/toh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a29013bad3fc1fb3ceed1c2ee3099e74105b8a2e --- /dev/null +++ b/full_models/toh/vocab.txt @@ -0,0 +1,32 @@ +| +a +i +u +n +g +e +h +o +l +m +y +d +v +s +k +w +b +t +r +z +p +f +j +' +- +x +9 +– +1 +5 + diff --git a/full_models/tom/D_100000.pth b/full_models/tom/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c0c91fdd413a8add50ee2db9f9a421d7dc901ef9 --- /dev/null +++ b/full_models/tom/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a5689b075ab21f45544caeb704f8e0b2864963e76a3b8def4ecfe0b7f973da +size 561078996 diff --git a/full_models/tom/G_100000.pth b/full_models/tom/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..68d8051b436fa7870600f6c2a4eea35cb973347b --- /dev/null +++ b/full_models/tom/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0debb0e36b19a9ee5a72e27900956b018b9eebe2335482a9da802b722f23d717 +size 436356040 diff --git a/full_models/tom/config.json b/full_models/tom/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tom/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tom/vocab.txt b/full_models/tom/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..be902edfd3be491a9bad238da134fbb3fdb0b884 --- /dev/null +++ b/full_models/tom/vocab.txt @@ -0,0 +1,28 @@ +m +g +y +a +k +p +l +f +' +h +r +c +w +- +t +_ +d +b +é +z +e +i +n + +o +s +u +j diff --git a/full_models/tos/D_100000.pth b/full_models/tos/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..10901e6a805612f7d411950c0d025174ef007e7d --- /dev/null +++ b/full_models/tos/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0980c119bff5a12726cebfd392a1fa79092f7bb1378ca8ed0da51016fca34e5b +size 561076171 diff --git a/full_models/tos/G_100000.pth b/full_models/tos/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f1adade3a1bc45a579298f8d1c63fbc5be6c1aa9 --- /dev/null +++ b/full_models/tos/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9faf0bfd6440322a4020c348c66faf41365e8a343eca11e51753c7c11cbbd2 +size 436364885 diff --git a/full_models/tos/config.json b/full_models/tos/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tos/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tos/vocab.txt b/full_models/tos/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f56171027df07554b0eaffeae0947179f26ce33c --- /dev/null +++ b/full_models/tos/vocab.txt @@ -0,0 +1,40 @@ +a +̱ +| +i +u +n +t +c +h +l +x +m +k +p +á +s +y +o +q +í +j +ú +z +e +- +d +r +ó +b +g +é +f +v +' +ñ +0 +ï +ì +1 + diff --git a/full_models/tpi/D_100000.pth b/full_models/tpi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9d99937a81bf4b611023747f3b7a4dc13ccb4595 --- /dev/null +++ b/full_models/tpi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:504523d81f5a96cb8df2517b287c0b89b913e52a536ce21e16906d027dfc5de0 +size 561078503 diff --git a/full_models/tpi/G_100000.pth b/full_models/tpi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1ee6bd66a66cc88c7b1ff07fa3bd6b08181c3336 --- /dev/null +++ b/full_models/tpi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cefa302086a186aaf6991fed645a0851e450da782f6a46d0185dadcc4fdcc56 +size 436375983 diff --git a/full_models/tpi/config.json b/full_models/tpi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tpi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tpi/vocab.txt b/full_models/tpi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cdbe3de9ceb75a20339078946bee484ff6a70bea --- /dev/null +++ b/full_models/tpi/vocab.txt @@ -0,0 +1,37 @@ +' +l +_ +6 +o +e +s +7 +r +f +n +1 +u +4 +q +8 +k +- +i +2 +j +v +h +w +p +0 +9 +t +d +5 +m +y +g +a + +3 +b diff --git a/full_models/tpm/D_100000.pth b/full_models/tpm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5d6f4cca1f1c5dd57fbdaa2e79cd46a91a719899 --- /dev/null +++ b/full_models/tpm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:943b0defecdbe253d8df7b779a63db20992d03ff0b98d3c046db549598a13515 +size 561078833 diff --git a/full_models/tpm/G_100000.pth b/full_models/tpm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3ba7b92546b5b13a883b12df6ca2d918ac4f69cd --- /dev/null +++ b/full_models/tpm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f3d1292a6020c535ee262fd0a0e44784917c6d9493d72ab6b3d054df1af24b +size 436363075 diff --git a/full_models/tpm/config.json b/full_models/tpm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tpm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tpm/vocab.txt b/full_models/tpm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c498a0844868242d866252ab633d5e80f909b42e --- /dev/null +++ b/full_models/tpm/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +n +u +m +o +k +ɛ +s +t +b +y +l +e +h +w +d +ɔ +r +f +g +c +ŋ +p +z +v +j +' + diff --git a/full_models/tpp/D_100000.pth b/full_models/tpp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e856fc2813de3b034c03ae875dbdcfe2817b1c49 --- /dev/null +++ b/full_models/tpp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adfc0444b0c979b80d5e11e52e82a26e305a6b0b88392a479b32f3e4089b9006 +size 561078617 diff --git a/full_models/tpp/G_100000.pth b/full_models/tpp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d3f0ea05c2b46442ac172ad4c191bb992544b375 --- /dev/null +++ b/full_models/tpp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3cccb12d01c0e950a8105b9363d632c01da3d6adc136a1c0f246294ff29db0c +size 436394441 diff --git a/full_models/tpp/config.json b/full_models/tpp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tpp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tpp/vocab.txt b/full_models/tpp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6308f160bd0563f351365c2470fe911cc6bef7e5 --- /dev/null +++ b/full_models/tpp/vocab.txt @@ -0,0 +1,45 @@ +a +| +i +n +t +h +' +l +u +k +c +y +s +x +j +m +p +w +o +e +r +d +b +ú +— +g +é +f +ó +í +v +z +á +q +0 +4 +́ +1 +6 +ñ +` +2 +- +3 + diff --git a/full_models/tpt/D_100000.pth b/full_models/tpt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a05ad7777de5a56672a1a378d7d392a6b29fb93e --- /dev/null +++ b/full_models/tpt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05bde876e1b29602fe25e880627661ecb12da38825ab6a03254289ba073d0f98 +size 561078634 diff --git a/full_models/tpt/G_100000.pth b/full_models/tpt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f43af371dd3807ef786fe21dc284901de3f55d03 --- /dev/null +++ b/full_models/tpt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21e9a7ae480151343cc46679252386f69c1502b83d5e873df864e733afaaa9f5 +size 436385112 diff --git a/full_models/tpt/config.json b/full_models/tpt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tpt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tpt/vocab.txt b/full_models/tpt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f65e8ee77c79e14ff92d57baf880d0b4fec2858c --- /dev/null +++ b/full_models/tpt/vocab.txt @@ -0,0 +1,41 @@ +a +| +n +i +t +u +k +l +ʼ +h +y +c +s +x +j +o +p +m +q +v +e +r +d +ú +b +— +í +é +g +f +ó +á +z +0 +4 +1 +3 +ñ +2 +- + diff --git a/full_models/trc/D_100000.pth b/full_models/trc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a39c35c995007b423e8c18211a404de7b0d7f005 --- /dev/null +++ b/full_models/trc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fe2755527e63b0e14b0fd6d02a69b28a479409a32286b23b783723280a0bde +size 561076076 diff --git a/full_models/trc/G_100000.pth b/full_models/trc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66f5023aeea6d53d150b5bc6cc47a24b25b60096 --- /dev/null +++ b/full_models/trc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7332f926b881f4ba5ab35ee2f7025129080444d6664188bb0b4f13d3d34f3b14 +size 436366913 diff --git a/full_models/trc/config.json b/full_models/trc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/trc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/trc/vocab.txt b/full_models/trc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b6c6d028eebe1db7053e6d91265d93a42d3e2bab --- /dev/null +++ b/full_models/trc/vocab.txt @@ -0,0 +1,41 @@ +n +r +o +h +ó +l +á +ô +y +e +d +ú +f +ꞌ +j +â +z +ñ +m +b +‐ +q +í +é +ê +i +x +û +p +ü +s +v +a +_ +̱ + +t +c +k +u +g diff --git a/full_models/tri/D_100000.pth b/full_models/tri/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a29911c8d8c6959a6e6519d938b4c1043ed6aff7 --- /dev/null +++ b/full_models/tri/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d36011febcfde353cd86d209377d0bdf7b7e869afc82b96dd845aba5d6db124 +size 561079016 diff --git a/full_models/tri/G_100000.pth b/full_models/tri/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..65c929e1f37608463836c3c7ef6d0be67331f074 --- /dev/null +++ b/full_models/tri/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74b81dddaf981923b5952ab011a6f3f4e5465de58d1ac9e30970e2a4a546eed +size 436383845 diff --git a/full_models/tri/config.json b/full_models/tri/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tri/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tri/vocab.txt b/full_models/tri/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a949c65b3b58ce466a9b96ef177dd4a0125bedf3 --- /dev/null +++ b/full_models/tri/vocab.txt @@ -0,0 +1,38 @@ +| +a +n +e +ë +o +t +i +r +k +m +p +ï +h +j +w +u +s +' +ʻ +- +0 +1 +2 +3 +7 +4 +5 +6 +9 +8 +l +z +y +g +f +ƒ + diff --git a/full_models/trn/D_100000.pth b/full_models/trn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..319cef9d029328495099fe29d56a361f115d6651 --- /dev/null +++ b/full_models/trn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:931b36571526a63d7e2a68776c9085f75aada5e678b677e1d46db6f7cffc3683 +size 561078831 diff --git a/full_models/trn/G_100000.pth b/full_models/trn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bfabf4daf732a6558e5b93b229f0d9ef29e2b37f --- /dev/null +++ b/full_models/trn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eec3a6f495e8764531d36ab870c0359e1bcb2d941a697849f3d698f2a7ed631 +size 436379315 diff --git a/full_models/trn/config.json b/full_models/trn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/trn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/trn/vocab.txt b/full_models/trn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..76c68a10c941d9fdecaeceaa0a983cd84be5dd52 --- /dev/null +++ b/full_models/trn/vocab.txt @@ -0,0 +1,37 @@ +_ +z +ñ +á +x +g +c +e +o +v +y +— +k +i +p +l +f +a +s +ó +u +ú +t +d +1 +n +q + +é +h +j +í +‐ +b +' +m +r diff --git a/full_models/trs/D_100000.pth b/full_models/trs/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ad5a310148765b48bf54089d4dea5672847d9bc0 --- /dev/null +++ b/full_models/trs/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d4dd8fd9e02faa3064918afc636a203c4adf528f1297ea9d57eb2dbefad679f +size 561078105 diff --git a/full_models/trs/G_100000.pth b/full_models/trs/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a3fedb6fe4fabf48b05e4323f926c3b0323296f0 --- /dev/null +++ b/full_models/trs/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1f9a983bc169706e4381317be35fd5e82aa3bfa201dffbbc510d9fa50b0258 +size 436412484 diff --git a/full_models/trs/config.json b/full_models/trs/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/trs/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/trs/vocab.txt b/full_models/trs/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0ab0cc053766d5e6a786e11df2e59b85438de0a7 --- /dev/null +++ b/full_models/trs/vocab.txt @@ -0,0 +1,53 @@ +n +p +r +c +ï +' +î +̀ +ó + +ú +- +q +l +k +e +_ +d +h +ë +u +ò +û +ì +z +b +x +à +ù +s +í +o +̱ +v +t +̂ +g +ḯ +è +á +j +ñ +— +́ +m +i +â +y +f +é +ô +a +ê diff --git a/full_models/tso/D_100000.pth b/full_models/tso/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dce68adec9388237920173769aaad540fe73e169 --- /dev/null +++ b/full_models/tso/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e474aa1cf7a020b59e60242bcce50198066d5aa45555b58c2bc6149083b0f5 +size 561079013 diff --git a/full_models/tso/G_100000.pth b/full_models/tso/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..662ccc3d047aa45fa81728f794895ee560c15f16 --- /dev/null +++ b/full_models/tso/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f71d503b54491338edc2e2e63d0273dabcc213f1910467445af3c2ac5a9c225b +size 436363581 diff --git a/full_models/tso/config.json b/full_models/tso/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tso/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tso/vocab.txt b/full_models/tso/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..6f966e02009751d79cd048fff42bbf177f7849a0 --- /dev/null +++ b/full_models/tso/vocab.txt @@ -0,0 +1,30 @@ +h +z +w +s +' +l +r +m +o +p +v +k +j +g +n +d +i +t +- +f +a +x +b +y +c +_ + +e +u +q diff --git a/full_models/tsz/D_100000.pth b/full_models/tsz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..edaf2bc04a83fd93e3e6a0868046557c6d91b55b --- /dev/null +++ b/full_models/tsz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80a25d7fac465fb379a3afe2bd81bdb92b0401811b450c9ca4316e240349c6fa +size 561078373 diff --git a/full_models/tsz/G_100000.pth b/full_models/tsz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1d5e82755e9016c21f441ada42203e896caff3a0 --- /dev/null +++ b/full_models/tsz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c03ce593fd1d9b1635ee363f0bb7a00f27c33afd1806d0ed89391eaac3c4008 +size 436373792 diff --git a/full_models/tsz/config.json b/full_models/tsz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tsz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tsz/vocab.txt b/full_models/tsz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..96165c316a2f1f4e63dd03eda3b6e68857487138 --- /dev/null +++ b/full_models/tsz/vocab.txt @@ -0,0 +1,36 @@ +a +| +i +n +k +e +u +s +r +t +h +j +m +p +ï +c +á +d +g +o +b +é +í +ó +x +' +ú +l +– +f +î +- +́ +v +` + diff --git a/full_models/ttc/D_100000.pth b/full_models/ttc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..884854e460022a75b632b61c47effef4d85dd3e6 --- /dev/null +++ b/full_models/ttc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60a44caa7483fe06cda148101f61d86999f751edb5e3f297b3ea715315bba1e +size 561078879 diff --git a/full_models/ttc/G_100000.pth b/full_models/ttc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..82b9be47ecda33609ba4685c652cb4dcb9b02f43 --- /dev/null +++ b/full_models/ttc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57992e230682b7f3fd232a3b331829b85dc50b802eb260a79192ad3c05498391 +size 436378704 diff --git a/full_models/ttc/config.json b/full_models/ttc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ttc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ttc/vocab.txt b/full_models/ttc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..429a5b221779c103626551a586b5e2899a899ace --- /dev/null +++ b/full_models/ttc/vocab.txt @@ -0,0 +1,37 @@ +— +d +n +j +a +r +á +f +e +_ +t +b +í +v +y +k +z +u +x +p +l +s +h +i +- +ú +o +q +m +ñ +g +é +w +c +' +ó + diff --git a/full_models/tte/D_100000.pth b/full_models/tte/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cdaba6f05fc0ed96995492ae409ac4bf8a6ddc1a --- /dev/null +++ b/full_models/tte/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfd2529d481561c7088134eb98821d97b7ee2e51f29eb553613e69168451021 +size 561078700 diff --git a/full_models/tte/G_100000.pth b/full_models/tte/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..48e61a3321da37c96b8e4d46dd8edb544dc2fba4 --- /dev/null +++ b/full_models/tte/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abefa9d1dc80d58473f997b916e03c7949d3e823a26571a280e1f0c063d3f2f4 +size 436355160 diff --git a/full_models/tte/config.json b/full_models/tte/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tte/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tte/vocab.txt b/full_models/tte/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f7320679680fea2325f5edcec1cb124847e49bd4 --- /dev/null +++ b/full_models/tte/vocab.txt @@ -0,0 +1,28 @@ +1 +w +6 +y +' +t +- +p +s +m +n +v +b +4 +f +l +_ +k +a +o +3 +g +i +d +u +0 + +e diff --git a/full_models/ttq-script_tifinagh/D_100000.pth b/full_models/ttq-script_tifinagh/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..7f49f2f20b36f2eb4a56d4a1b4acc67304686d2e --- /dev/null +++ b/full_models/ttq-script_tifinagh/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba0c5bba8f766ab66d41d735408551208328343aee0b430731a2490e34098a9 +size 561079012 diff --git a/full_models/ttq-script_tifinagh/G_100000.pth b/full_models/ttq-script_tifinagh/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..ab4154e4d110d944e6bca84a36c9329ee3a11cce --- /dev/null +++ b/full_models/ttq-script_tifinagh/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6456c123ef8e96123c21ffce76cc1ebc356b30ebccbf519b5156f85faf98fad0 +size 436355466 diff --git a/full_models/ttq-script_tifinagh/config.json b/full_models/ttq-script_tifinagh/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ttq-script_tifinagh/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ttq-script_tifinagh/vocab.txt b/full_models/ttq-script_tifinagh/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9d8d9bb4b08bdca333d077df55085a117fb85428 --- /dev/null +++ b/full_models/ttq-script_tifinagh/vocab.txt @@ -0,0 +1,26 @@ +| +ⵏ +ⵜ +ⴹ +ⵙ +ⵓ +ⵍ +ⵎ +ⵔ +ⴰ +ⵢ +ⵗ +ⴾ +ⴶ +ⵤ +⵿ +ⴼ +ⵛ +ⵀ +ⵂ +ⵆ +ⵈ +ⵌ +' +ⵑ + diff --git a/full_models/tue/D_100000.pth b/full_models/tue/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1292ce14d0ae00228fef1716ac123aad92661a74 --- /dev/null +++ b/full_models/tue/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5bec8c90f987eb35677fe07c5df81b3757d5524d587f591601387cda7bcedca +size 561078596 diff --git a/full_models/tue/G_100000.pth b/full_models/tue/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4b1839b882a5d85e60a0107941979b0cb1b3a920 --- /dev/null +++ b/full_models/tue/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f60ec85edea370cebb24fc659e2b8a6cc14aad3b7702810a0f760064cc461c +size 436396629 diff --git a/full_models/tue/config.json b/full_models/tue/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tue/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tue/vocab.txt b/full_models/tue/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bbcd41f38d12313b07113fb97cb4f71f4bb9da22 --- /dev/null +++ b/full_models/tue/vocab.txt @@ -0,0 +1,46 @@ +| +r +i +a +̶ +e +u +c +ã +t +o +m +ĩ +n +ũ +p +s +d +g +y +j +w +b +õ +ñ +ẽ +é +á +ú +í +ó +́ +ṹ +q +l +h +ṍ +— +f +v +z +- +' +x +k + diff --git a/full_models/tuf/D_100000.pth b/full_models/tuf/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e5236f4ab37460427b8bc9368d4fdfb0a74ef267 --- /dev/null +++ b/full_models/tuf/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd448dd5585e8b255f9a36d91839bef67182a17e5860e8cc984769aabcede520 +size 561078837 diff --git a/full_models/tuf/G_100000.pth b/full_models/tuf/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..788b625f4e385e59cd13f833321aac207b00378f --- /dev/null +++ b/full_models/tuf/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1533af67dc1be615a6ae61f0cf1e3ce78fc180726faa1c26c9e1b2cd6c2bc81 +size 436375836 diff --git a/full_models/tuf/config.json b/full_models/tuf/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tuf/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tuf/vocab.txt b/full_models/tuf/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..836b28befbfaf3f60ae76945bccc1e0987edb31b --- /dev/null +++ b/full_models/tuf/vocab.txt @@ -0,0 +1,37 @@ +̃ +j +u +z + +y +_ +b +ñ +— +a +x +o +m +f +w +i +r +c +e +h +t +n +k +l +ó +s +v +d +p +- +á +í +ú +g +q +é diff --git a/full_models/tuk-script_arabic/D_100000.pth b/full_models/tuk-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8ef19c36ab4917e4aeddc6bd8aadf54bf6ad3fcd --- /dev/null +++ b/full_models/tuk-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:537e33a12238e8b9541316755589a97bf211f4893d826529408126187ff44455 +size 561077812 diff --git a/full_models/tuk-script_arabic/G_100000.pth b/full_models/tuk-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..65df5d883b6e23d0f2e61b0cec645d68e0100643 --- /dev/null +++ b/full_models/tuk-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4f50816a6cd4271da90686a29cc825f39e6b0573c365e1983cee9b6ccec664 +size 436375388 diff --git a/full_models/tuk-script_arabic/config.json b/full_models/tuk-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tuk-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tuk-script_arabic/vocab.txt b/full_models/tuk-script_arabic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a83f638888c9a94ede432074f55835394b3beba1 --- /dev/null +++ b/full_models/tuk-script_arabic/vocab.txt @@ -0,0 +1,41 @@ +ی +| +ا +ن +ر +ل +د +و +گ +م +س +ب +ه +ت +ق +ز +ش +پ +ک +آ +غ +چ +ع +خ +ج +ح +- +ف +ط +ص +‍ +ض +ظ +ئ +ث +ٰ +ذ +– +' +ژ + diff --git a/full_models/tuk-script_latin/D_100000.pth b/full_models/tuk-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..43a98fec08c2cce3cd0419e2af9c4736a83ce6dd --- /dev/null +++ b/full_models/tuk-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31b8942fd6bf5a5cabf9ed49235f4adfd34f695a6775ed946932655c2284bef4 +size 561078871 diff --git a/full_models/tuk-script_latin/G_100000.pth b/full_models/tuk-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d2e4baaa971744d8c5846c2b447f9398bc9ca328 --- /dev/null +++ b/full_models/tuk-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aec907fdac78857fe11574de05ba9b7c2895fc8af64b4d2e14af9943763735c +size 436377076 diff --git a/full_models/tuk-script_latin/config.json b/full_models/tuk-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tuk-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tuk-script_latin/vocab.txt b/full_models/tuk-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3ad5e7649a4cf3e0383169e058934de06be7babe --- /dev/null +++ b/full_models/tuk-script_latin/vocab.txt @@ -0,0 +1,36 @@ +ş +ý +b +m +y +w +ž +s +a +g +ü +h +' +z +_ +u +k +i +ň +d +f +o +t +ä +- +j +r +ö +– +n +ç +‐ + +p +l +e diff --git a/full_models/tuo/D_100000.pth b/full_models/tuo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..730b3752873ddad22c5c88d7e483279ea6cd0b78 --- /dev/null +++ b/full_models/tuo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed1aca1b446f7172d9841ea98f55a42ce079d1a080cb926e1263a13e5da78d9 +size 561078626 diff --git a/full_models/tuo/G_100000.pth b/full_models/tuo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d6f12ca007923742456cf427095bb5f82413f14c --- /dev/null +++ b/full_models/tuo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f895299caf684028bef22a46243d436176dd406ef548394166c69d5fb2a56891 +size 436398930 diff --git a/full_models/tuo/config.json b/full_models/tuo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tuo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tuo/vocab.txt b/full_models/tuo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cd6b00c5b643ce88df4b5a823f8f819faf91b8eb --- /dev/null +++ b/full_models/tuo/vocab.txt @@ -0,0 +1,47 @@ +| +a +e +r +i +ʉ +' +o +ã +c +t +n +s +m +w +u +j +p +ĩ +̃ +ẽ +õ +y +g +b +d +ñ +q +ũ +í +́ +l +ú +é +— +̶ +ó +á +f +h +v +ṍ +z +ṹ +k +x + diff --git a/full_models/tur/D_100000.pth b/full_models/tur/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..2dc79311301cb2c55ed3192dd89b1617c32ab8aa --- /dev/null +++ b/full_models/tur/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e3cf33b321d9a6a381697832751b9ff5d9b2cc5466f3db4c6bae2b04e1aec8 +size 561110637 diff --git a/full_models/tur/G_100000.pth b/full_models/tur/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..b0a1803d10da983733416f8d3cc083d8f2eae29e --- /dev/null +++ b/full_models/tur/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b111ce8ae133959fa22eba70b5609b240cbee3ec7e21e308d5d309d4ffa176e +size 436631681 diff --git a/full_models/tur/config.json b/full_models/tur/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tur/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tur/vocab.txt b/full_models/tur/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..71421ff99fb90d7b7beeb7517f570e66f856c377 --- /dev/null +++ b/full_models/tur/vocab.txt @@ -0,0 +1,43 @@ +d +h +e +ş +̇ +n +ü +û +î +ı +b +i + +â +_ +f +3 +r +z +c +m +v +p +' +ö +ğ +6 +0 +g +2 +u +a +k +j +ç +4 +l +y +t +o +1 +s +- diff --git a/full_models/tvw/D_100000.pth b/full_models/tvw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..449e9a8c1589d5e25366c8484adcd137e0b77250 --- /dev/null +++ b/full_models/tvw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26269bb4642e6256db7325b5a53507e9d7cc984de03c674ed57e536239adb6f +size 561078956 diff --git a/full_models/tvw/G_100000.pth b/full_models/tvw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a6e97603589a07dba47df3407b6509355bfff3b1 --- /dev/null +++ b/full_models/tvw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3606593223c9f7ebdfa6c284279feed26cef24e30f87c3ebda2aa638caddcb52 +size 436359946 diff --git a/full_models/tvw/config.json b/full_models/tvw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tvw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tvw/vocab.txt b/full_models/tvw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..11e6374a21aeddb675146dcd9258073da7ae095c --- /dev/null +++ b/full_models/tvw/vocab.txt @@ -0,0 +1,29 @@ +d +y +f +o +s +e +r +j +5 +w +l +b +k +i +a +h +c +n +4 +0 +u +_ +' +p +m +g + +t +- diff --git a/full_models/twb/D_100000.pth b/full_models/twb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..169c9fb05f9dca8f5764d5e9fc40ddc8e50da5de --- /dev/null +++ b/full_models/twb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019dde4cd12fe6f2e25ee735eb471bb7fb34be57f4230ce1ef166d93e3c957ec +size 561079014 diff --git a/full_models/twb/G_100000.pth b/full_models/twb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2c0ea617bd18738a17b8499109751217dd6b2a6a --- /dev/null +++ b/full_models/twb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d479d18b8d4443476e2b9a0598a139c0367b63b5199c3dc32193a74e57dba2c +size 436365290 diff --git a/full_models/twb/config.json b/full_models/twb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/twb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/twb/vocab.txt b/full_models/twb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..25705916c64c3bc1945bb6d368b1a52bec91d1b3 --- /dev/null +++ b/full_models/twb/vocab.txt @@ -0,0 +1,31 @@ +6 +i +o +d +3 +u +2 + +- +r +b +y +e +' +s +_ +g +w +1 +a +k +p +4 +t +f +0 +7 +l +v +m +n diff --git a/full_models/twe/D_100000.pth b/full_models/twe/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..51cde4b364d4dae99174005622cb7472302d937b --- /dev/null +++ b/full_models/twe/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aae8557e44ecff07e17c7db671daa0104b29c4a66d9e0ae8f19614e5366796f5 +size 561076028 diff --git a/full_models/twe/G_100000.pth b/full_models/twe/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..973afe5af28af6d6cd8eee34b3698b0a41a39103 --- /dev/null +++ b/full_models/twe/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e440e2dd1448e1a1aed7f8d501d627bbbf39ff78595e5d0b5efa5dae0cbfd98c +size 436338250 diff --git a/full_models/twe/config.json b/full_models/twe/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/twe/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/twe/vocab.txt b/full_models/twe/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1ea3f5163ed4aaa8d0d2edd08e085db599591b2e --- /dev/null +++ b/full_models/twe/vocab.txt @@ -0,0 +1,29 @@ +i +o +' +a +b +j +n +v + +g +h +f +x +y +u +e +m +- +w +k +p +q +_ +l +r +t +s +c +d diff --git a/full_models/twu/D_100000.pth b/full_models/twu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cc9ad08d32cba051040e2b2cde41fcd5f07b6c8e --- /dev/null +++ b/full_models/twu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed14d7b294f6e29fc6ac529ab9c916c6876a93812bfa980144d32a93bd14f895 +size 561078640 diff --git a/full_models/twu/G_100000.pth b/full_models/twu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..12a7ce1de13015ab2350789512c3604c4930a018 --- /dev/null +++ b/full_models/twu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad436699412a4228d4cb181c7545821971fccca23a9d236288e6f94ac37e87d1 +size 436357059 diff --git a/full_models/twu/config.json b/full_models/twu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/twu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/twu/vocab.txt b/full_models/twu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..02be69fbee1933ef67552754a7d4704456d6a7aa --- /dev/null +++ b/full_models/twu/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +e +o +l +i +u +m +s +t +k +d +h +b +' +f +- +g +p +y +r +z +w +j +c +9 + diff --git a/full_models/txa/D_100000.pth b/full_models/txa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d1d8984b37c49fb9ee2557b040eff9d91a04a964 --- /dev/null +++ b/full_models/txa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca20ebe981d433e20ea1ba70b35890fb054007b7443632a2fb2616198130ddf +size 561079095 diff --git a/full_models/txa/G_100000.pth b/full_models/txa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..497bf13c4b5a4942c7efc8278d61b21776c39e24 --- /dev/null +++ b/full_models/txa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb66b15ae10cb53fc48f51c3996bb460cec915aae42e23383951c68d9e48f7e +size 436347623 diff --git a/full_models/txa/config.json b/full_models/txa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/txa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/txa/vocab.txt b/full_models/txa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bfaf80ddcd08d4803d1f98da263fc9be951d7522 --- /dev/null +++ b/full_models/txa/vocab.txt @@ -0,0 +1,23 @@ +y +' +m +h + +j +a +k +o +u +g +l +r +p +i +d +_ +- +n +s +b +w +t diff --git a/full_models/txq/D_100000.pth b/full_models/txq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4ac0f8eebdd2cb4f7eb06c331274de5f243d399 --- /dev/null +++ b/full_models/txq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200d785f5221ee49be6a3c867beae3677f97cf310f6507247a8fce2b46a71e92 +size 561078611 diff --git a/full_models/txq/G_100000.pth b/full_models/txq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1be01ac5fac0d185e13f5e1cce16dc3cc3f1916e --- /dev/null +++ b/full_models/txq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf51dc2d4d52a0e0c5dea80dfd28d2399995b01433dd73b4e6a1add7c4ff8985 +size 436380374 diff --git a/full_models/txq/config.json b/full_models/txq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/txq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/txq/vocab.txt b/full_models/txq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..50ac23f6f38d59b9684bf92725e53e1c8275f171 --- /dev/null +++ b/full_models/txq/vocab.txt @@ -0,0 +1,39 @@ +y +r +ꞌ + +2 +5 +t +1 +g +a +4 +b +3 +0 +f +d +' +8 +o +m +k +s +- +w +_ +e +p +i +— +h +9 +6 +n +z +l +u +c +7 +j diff --git a/full_models/txu/D_100000.pth b/full_models/txu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ec15fcac27b1f7018d41416eb03ad88f50b61b21 --- /dev/null +++ b/full_models/txu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abde6a3e8b4155ee6fbd8352cf538c919051b891410213450b194e0f4bd26b9d +size 561076927 diff --git a/full_models/txu/G_100000.pth b/full_models/txu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a8edfd6ae7bd5fa9eaf7426dc078742b2d81991c --- /dev/null +++ b/full_models/txu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601bff9877775fd3f0c8cddc64e4535278aecf1579279d411db77a74b6f26c29 +size 436388149 diff --git a/full_models/txu/config.json b/full_models/txu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/txu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/txu/vocab.txt b/full_models/txu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c0b2ede2d45afb8e2c45c6260139b0d5339a9442 --- /dev/null +++ b/full_models/txu/vocab.txt @@ -0,0 +1,43 @@ +õ +' +2 +j +u +0 +ã +1 +3 +ĩ +ũ +9 +ê +ỳ +7 +8 +ô +m +a +6 +k +ẽ +— +w +o +4 +g +i +x +t +y +ỹ +e +5 +r +n +d + +h +à +p +b +_ diff --git a/full_models/tye/D_100000.pth b/full_models/tye/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8c5a39ba74a557ec6fbb1dfdee3f60ef3048dd3e --- /dev/null +++ b/full_models/tye/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07cade85e776b1f5beaf23baceded05675aff626dfb4be7ec0de17a04207490b +size 561078629 diff --git a/full_models/tye/G_100000.pth b/full_models/tye/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b7603e40bd6687f873801b5d49b75fb6804c995b --- /dev/null +++ b/full_models/tye/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893f73eb4a46a9ebb8946055dc92dc205c30084b73b9894e6d08b817e3a06e07 +size 436401200 diff --git a/full_models/tye/config.json b/full_models/tye/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tye/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tye/vocab.txt b/full_models/tye/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..02fad2c3fe11a76f70063f4ac68b94701c4a8dc0 --- /dev/null +++ b/full_models/tye/vocab.txt @@ -0,0 +1,48 @@ +r +l +_ +f +s +ḿ +í +v +ì +á +à +d +ã +ò +h +́ +ń +ó + +i +ǹ +b +o +j +ũ +̀ +z +è +g +w +u +c +é +m +ĩ +n +k +t +e +' +y +ɔ +ù +a +ɛ +̃ +p +ú diff --git "a/full_models/tzh-dialect_bachaj\303\263n/D_100000.pth" "b/full_models/tzh-dialect_bachaj\303\263n/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..dd9e9cf5f10ca79225bf977796d9444d1bdb6b5f --- /dev/null +++ "b/full_models/tzh-dialect_bachaj\303\263n/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4003ca4a1c70ff1134adae872672d6c744b8d71f510d0e0f3082e70e5cbaa1 +size 561077956 diff --git "a/full_models/tzh-dialect_bachaj\303\263n/G_100000.pth" "b/full_models/tzh-dialect_bachaj\303\263n/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..466361e26ff7abd3036ecaafb60f36c7c8895059 --- /dev/null +++ "b/full_models/tzh-dialect_bachaj\303\263n/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f9c7e3c4c5ff1ac84af68e23ed22e7c37cc30faa039d1b801871275f9d7a4f4 +size 436368015 diff --git "a/full_models/tzh-dialect_bachaj\303\263n/config.json" "b/full_models/tzh-dialect_bachaj\303\263n/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/tzh-dialect_bachaj\303\263n/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/tzh-dialect_bachaj\303\263n/vocab.txt" "b/full_models/tzh-dialect_bachaj\303\263n/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..b014551343f651c7556a396224bbda408f709c91 --- /dev/null +++ "b/full_models/tzh-dialect_bachaj\303\263n/vocab.txt" @@ -0,0 +1,36 @@ +| +a +t +c +e +i +l +' +u +h +o +n +s +y +b +m +j +x +p +w +r +q +d +- +ú +g +í +é +ó +f +á +z +v +ñ +6 + diff --git a/full_models/tzh-dialect_tenejapa/D_100000.pth b/full_models/tzh-dialect_tenejapa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fa93a65ed0e8dab360302fc1fb3563c5fa62fc9e --- /dev/null +++ b/full_models/tzh-dialect_tenejapa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150c61060b872f56e3df75d4f61971718cfa790af9bab0826ecb5b0348493459 +size 561078624 diff --git a/full_models/tzh-dialect_tenejapa/G_100000.pth b/full_models/tzh-dialect_tenejapa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7030b6e298a42b4fca8045c7b80a655a5100e5de --- /dev/null +++ b/full_models/tzh-dialect_tenejapa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a9ff33cd26fa4c43cd2dd2dc34bbda48bf5b3f1f2f0b725ff79d84f1044d8f +size 436375874 diff --git a/full_models/tzh-dialect_tenejapa/config.json b/full_models/tzh-dialect_tenejapa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tzh-dialect_tenejapa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tzh-dialect_tenejapa/vocab.txt b/full_models/tzh-dialect_tenejapa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..37ef3c212abe8e21cd411503bb261cfa452225dd --- /dev/null +++ b/full_models/tzh-dialect_tenejapa/vocab.txt @@ -0,0 +1,37 @@ +| +a +e +t +i +c +l +' +u +o +y +s +n +j +b +m +x +h +q +p +w +r +d +— +- +g +ú +ó +f +é +í +z +v +ñ +á +k + diff --git a/full_models/tzj-dialect_eastern/D_100000.pth b/full_models/tzj-dialect_eastern/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1a1e94c8ed39cd6afacd686666aebb3db9837033 --- /dev/null +++ b/full_models/tzj-dialect_eastern/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ed898bcdabab9fc56197362d32a85f8c6787c74229e5fe2364b47b26514867 +size 561078727 diff --git a/full_models/tzj-dialect_eastern/G_100000.pth b/full_models/tzj-dialect_eastern/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6ab429a3f996b61eb73fee295dc6e1a48005c7ee --- /dev/null +++ b/full_models/tzj-dialect_eastern/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57c8f9bb087a9d81d720560f1fb906b01683af926209bbef71b1612c358a1522 +size 436375973 diff --git a/full_models/tzj-dialect_eastern/config.json b/full_models/tzj-dialect_eastern/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tzj-dialect_eastern/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tzj-dialect_eastern/vocab.txt b/full_models/tzj-dialect_eastern/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..8518c33301522b7f72b221a021e856b82ae33165 --- /dev/null +++ b/full_models/tzj-dialect_eastern/vocab.txt @@ -0,0 +1,37 @@ +a +x +n +i +o +p +í +d + +_ +r +e +é +— +ú +' +m +l +j +b +y +z +u +ñ +c +k +h +w +s +t +- +v +á +f +q +g +ó diff --git a/full_models/tzj-dialect_western/D_100000.pth b/full_models/tzj-dialect_western/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b6f1f095d219aaa692888f9d728d4a107c75833 --- /dev/null +++ b/full_models/tzj-dialect_western/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f1a34cd5d338cdfbd1fe42bc6a9820320cd317f1719ee17986c08af985a473 +size 561078624 diff --git a/full_models/tzj-dialect_western/G_100000.pth b/full_models/tzj-dialect_western/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..022abb31f4ffee2e4e565c54b3b92d2d60f587f9 --- /dev/null +++ b/full_models/tzj-dialect_western/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db56c617eba62cead234ffb467f39550673726116e4672a5c4cd9bca35fea005 +size 436375884 diff --git a/full_models/tzj-dialect_western/config.json b/full_models/tzj-dialect_western/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tzj-dialect_western/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tzj-dialect_western/vocab.txt b/full_models/tzj-dialect_western/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5bf3152adf46dc4c41a31689182e0768339c07ad --- /dev/null +++ b/full_models/tzj-dialect_western/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +j +n +c +' +e +o +r +t +u +h +l +k +m +x +w +q +b +s +p +z +y +d +g +— +í +ú +á +f +ó +é +v +̱ +ñ + diff --git a/full_models/tzo-dialect_chamula/D_100000.pth b/full_models/tzo-dialect_chamula/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..702d50b8df295ff357e9cd5bd7b04184d584b7bd --- /dev/null +++ b/full_models/tzo-dialect_chamula/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeba1a3f9c8aa5d66718180770d530acdbfcfb6d33686aca55e512b7a96fafcb +size 561078624 diff --git a/full_models/tzo-dialect_chamula/G_100000.pth b/full_models/tzo-dialect_chamula/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dbda91a33f3d6c3298c4bc42792b300b058e4ef1 --- /dev/null +++ b/full_models/tzo-dialect_chamula/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf3d30f1cbe1041b82128293bcf7099d9b78554cf7713aeafcdc87be593c484 +size 436373669 diff --git a/full_models/tzo-dialect_chamula/config.json b/full_models/tzo-dialect_chamula/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/tzo-dialect_chamula/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/tzo-dialect_chamula/vocab.txt b/full_models/tzo-dialect_chamula/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..092898ac499c79f384fab842bf30892d42c67868 --- /dev/null +++ b/full_models/tzo-dialect_chamula/vocab.txt @@ -0,0 +1,36 @@ +| +a +t +i +c +l +u +' +e +o +j +n +s +x +b +y +h +m +v +q +p +r +d +— +- +í +g +f +á +ú +z +é +ó +k +ñ + diff --git "a/full_models/tzo-dialect_chenalh\303\263/D_100000.pth" "b/full_models/tzo-dialect_chenalh\303\263/D_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..f36bdc9ba32f747f86f813aea7b6af9894402536 --- /dev/null +++ "b/full_models/tzo-dialect_chenalh\303\263/D_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0565961a0995f4f1f7577809d7ea3d0e2864b4c6522484ee6ae329afd8afaafa +size 561078630 diff --git "a/full_models/tzo-dialect_chenalh\303\263/G_100000.pth" "b/full_models/tzo-dialect_chenalh\303\263/G_100000.pth" new file mode 100755 index 0000000000000000000000000000000000000000..cadc1dd67e0344219c09973505eb004901d2c302 --- /dev/null +++ "b/full_models/tzo-dialect_chenalh\303\263/G_100000.pth" @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15065431a39c9d26411f9f8e8348d383baed1052502b37f9020180db6ea70c3b +size 436373595 diff --git "a/full_models/tzo-dialect_chenalh\303\263/config.json" "b/full_models/tzo-dialect_chenalh\303\263/config.json" new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ "b/full_models/tzo-dialect_chenalh\303\263/config.json" @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git "a/full_models/tzo-dialect_chenalh\303\263/vocab.txt" "b/full_models/tzo-dialect_chenalh\303\263/vocab.txt" new file mode 100755 index 0000000000000000000000000000000000000000..82f25f860553ad505b17e3c2ae64b3fddbef2cbf --- /dev/null +++ "b/full_models/tzo-dialect_chenalh\303\263/vocab.txt" @@ -0,0 +1,36 @@ +| +a +c +i +l +t +' +u +o +e +n +s +j +h +b +y +x +m +v +q +p +r +d +— +g +z +- +í +f +ó +é +ú +á +k +ñ + diff --git a/full_models/ubl/D_100000.pth b/full_models/ubl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2426b9b8e847228875c081dacacf599567ba52e2 --- /dev/null +++ b/full_models/ubl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701f70bd7d086bea2aa9b24920df87ddbe02df6150eccbaaea96fbc6e2ab5e0f +size 561078894 diff --git a/full_models/ubl/G_100000.pth b/full_models/ubl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9041e5d886b3ebe85a41c2943dbd70256876c70d --- /dev/null +++ b/full_models/ubl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7a67a13e65f313df70c7fe14edde89391c5e92f48deea188eee6d570434e9a +size 436378987 diff --git a/full_models/ubl/config.json b/full_models/ubl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ubl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ubl/vocab.txt b/full_models/ubl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b6a62609d3921d5544c8b2431f79e8edf3d765b4 --- /dev/null +++ b/full_models/ubl/vocab.txt @@ -0,0 +1,37 @@ +j +a +_ +' +k +e +w +i +f +u +o +d +n +l +5 +h + +- +v +4 +6 +p +t +3 +g +c +0 +b +m +2 +s +z +x +q +r +1 +y diff --git a/full_models/ubu/D_100000.pth b/full_models/ubu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6a40f354687aaae73fde7fdcfa57994226568e42 --- /dev/null +++ b/full_models/ubu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22dd2332637cfd53a0be8aba57c9bea55b635937634442691d6c6d53acdfef2b +size 561076182 diff --git a/full_models/ubu/G_100000.pth b/full_models/ubu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e6aa67b9a3dded4eb24eb98ba2672d26be63ec0e --- /dev/null +++ b/full_models/ubu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1ca84e365f3fa6fa53fb144c1164ae95649af6059c2c7a2a694800b5d05c2a +size 436337475 diff --git a/full_models/ubu/config.json b/full_models/ubu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ubu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ubu/vocab.txt b/full_models/ubu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e4113b0c1fc5b5ad6e6bfb51cd2aad237063c351 --- /dev/null +++ b/full_models/ubu/vocab.txt @@ -0,0 +1,28 @@ +r + +i +' +o +ú +n +t +p +s +e +ó +í +m +w +a +u +_ +á +b +g +j +l +y +- +k +d +é diff --git a/full_models/udm/D_100000.pth b/full_models/udm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..19ac6d9fadc67edcbf929bf6356e6ba5e45426b2 --- /dev/null +++ b/full_models/udm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6f931b75ebf9f56d7971ba00dd356feaeffacb12149965ce4da93cbc49459da +size 561079224 diff --git a/full_models/udm/G_100000.pth b/full_models/udm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce525c6b5a81a33af1fe9d5393046f33a3448cd1 --- /dev/null +++ b/full_models/udm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a058f5a420ccb6fa7587768779accf9072d989ff2a750c950c705251281b4f +size 436392001 diff --git a/full_models/udm/config.json b/full_models/udm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/udm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/udm/vocab.txt b/full_models/udm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ebc6210582c0b943c637a29e913a96b4b779820b --- /dev/null +++ b/full_models/udm/vocab.txt @@ -0,0 +1,42 @@ +в +я +ж +ӥ +й +ш +ӟ +ӵ +у +б +и +ӝ +- +о +щ +л +п +м +ю +ц +т +– +д +а +г +э +к +е +р +ё +ч + +ы +ь +ӧ +с +н +_ +ф +ъ +з +х diff --git a/full_models/udu/D_100000.pth b/full_models/udu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b58dd6bbc1915908c84e038177ff0e4ab3f01b8 --- /dev/null +++ b/full_models/udu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa2eb4eaad2466f1160ec2aa19da63a441ae768721515c3f5fbcabd039cd4da +size 561078730 diff --git a/full_models/udu/G_100000.pth b/full_models/udu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8782d2fcedcf80ad417d1409a30c08fbd56dad80 --- /dev/null +++ b/full_models/udu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d765e8d928db1b7bd98c78111de898f164f20a08067a9305ec542667d1bfb09 +size 436369234 diff --git a/full_models/udu/config.json b/full_models/udu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/udu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/udu/vocab.txt b/full_models/udu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..05dea52d9bedea017ca8b5bd0d1fb444686002fb --- /dev/null +++ b/full_models/udu/vocab.txt @@ -0,0 +1,34 @@ +| +i +a +m +o +n +k +u +d +h +e +s +' +t +l +w +g +b +y +r +p +j +̱ +c +ḵ +ṯ +ŋ +ẖ +— +– +̧ +f +- + diff --git a/full_models/uig-script_arabic/D_100000.pth b/full_models/uig-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ada3d2ed9ccb24d28a8a68b0d8c9fc9f1811af8a --- /dev/null +++ b/full_models/uig-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc380568f71647dcfa81dec8dd8b1fc5c21ce65d97d6aab36deb1bbf406cbd9f +size 561078637 diff --git a/full_models/uig-script_arabic/G_100000.pth b/full_models/uig-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6b2e160276fcbd7f222ac1b54f05c206ec117ef0 --- /dev/null +++ b/full_models/uig-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7e4ee97ac4ae7c8621725074f171730d8c0637bcb1e4eb929c2246d9222b4a +size 436385333 diff --git a/full_models/uig-script_arabic/config.json b/full_models/uig-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/uig-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/uig-script_arabic/vocab.txt b/full_models/uig-script_arabic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7b15865a1637b343cd9be648a9ce35554cec8d31 --- /dev/null +++ b/full_models/uig-script_arabic/vocab.txt @@ -0,0 +1,41 @@ +ى +| +ا +ە +ل +ن +ر +ۇ +د +ئ +ت +ق +م +ي +ب +س +ك +ش +ڭ +غ +پ +ې +ز +ۈ +و +ھ +چ +گ +خ +ۋ +ۆ +- +ج +ف +0 +1 +2 +6 +5 +4 + diff --git a/full_models/uig-script_cyrillic/D_100000.pth b/full_models/uig-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9212c45f955da3c05a1dfe9f2843df60ab7de305 --- /dev/null +++ b/full_models/uig-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9e6b8cf88391a9fbc87b4fed7c22cd8f78ff1a7123b3a01f06ae47bacbb22d +size 561079123 diff --git a/full_models/uig-script_cyrillic/G_100000.pth b/full_models/uig-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0cf123cf8ad755550fe46786f3d497d4aa0dc761 --- /dev/null +++ b/full_models/uig-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983d2cdb538eb2b1dd88dff980d85eec8cbe145ebbac2cbcb30318aafab7918e +size 436407096 diff --git a/full_models/uig-script_cyrillic/config.json b/full_models/uig-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/uig-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/uig-script_cyrillic/vocab.txt b/full_models/uig-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..107ca6d58ffc5db649e9cda9913d2c03120e9bf6 --- /dev/null +++ b/full_models/uig-script_cyrillic/vocab.txt @@ -0,0 +1,48 @@ +ю +һ +­ +ә +х +_ +ь +й +е +м +г +ё +ч +б +қ +л +с +к +я +ф +т +о +4 +д +ж +ө +н +ш +ц +р +- +1 +з +2 +ң +0 +җ +у +ъ +а +ы + +в +п +и +— +ғ +ү diff --git a/full_models/ukr/D_100000.pth b/full_models/ukr/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6edbd6fcb9dbf1c3b41cc0805161cb3a0b8936e --- /dev/null +++ b/full_models/ukr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9783339c6af53892a065d9ac7e7c18ec2198d8d225aace7953de223f2c39ff48 +size 561078973 diff --git a/full_models/ukr/G_100000.pth b/full_models/ukr/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f536e42d2036a618e61bd75fc9d751b08c1fcdd --- /dev/null +++ b/full_models/ukr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c614d17abfc36f2ba21c2e46f1805567635918887d69e7f9b69d27070b017da2 +size 436383755 diff --git a/full_models/ukr/config.json b/full_models/ukr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ukr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ukr/vocab.txt b/full_models/ukr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0b49606d5480c11550d993794040f702dc9f8fd4 --- /dev/null +++ b/full_models/ukr/vocab.txt @@ -0,0 +1,39 @@ +| +о +а +и +в +н +і +т +с +е +р +д +л +у +м +п +к +б +я +з +г +й +ь +х +ч +ж +щ +ю +ш +ї +є +ц +— +' +ф +‐ +ґ +- + diff --git a/full_models/unr/D_100000.pth b/full_models/unr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..44b700fc6ad54fc367510fe21482261978383b5a --- /dev/null +++ b/full_models/unr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e13d59fd6f9b63be51f142fb3e11239083698978ccfaa079a703db1f92e7d4 +size 561075944 diff --git a/full_models/unr/G_100000.pth b/full_models/unr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4956c4d86a2f45721b818385a6e2dde48e12a3e8 --- /dev/null +++ b/full_models/unr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb215f45b2af6e918936f8c021f542fb0093efe137d3ef17aec80430918626bc +size 436395848 diff --git a/full_models/unr/config.json b/full_models/unr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/unr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/unr/vocab.txt b/full_models/unr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b726d451203122788a374280dde4d2702ee3e9f0 --- /dev/null +++ b/full_models/unr/vocab.txt @@ -0,0 +1,54 @@ +ହ +ଭ +ଙ +ା +ଜ +଼ +ଘ +ଏ +ଁ +ଫ +' +ୟ +କ +ଇ +ବ +ଖ +_ +ମ +ୁ +ଲ +ଚ + +ଗ +ି +ଉ +ଠ +ଦ +ସ +ଣ +ଷ +ଧ +ଶ +ତ +‍ +ୋ +ୱ +ଥ +୍ +ଂ +େ +ଛ +ଆ +ପ +ଞ +ଡ +ଅ +ଝ +ଟ +ଢ +ନ +ଯ +ୀ +ର +ଃ diff --git a/full_models/upv/D_100000.pth b/full_models/upv/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b618dc5bb05edd591cd4db252f4f9a3075d2d7dc --- /dev/null +++ b/full_models/upv/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b919eeb13e1c0aecee43b14ac0784f2638e49b03c53969a0e4465306cdb36cf4 +size 561079001 diff --git a/full_models/upv/G_100000.pth b/full_models/upv/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1fdd289e4817254ae3c40e65b32bdef81625218b --- /dev/null +++ b/full_models/upv/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a956bc735687178be6f0402d4f623daab82d2b62939d543b94773c5a0af3f490 +size 436364085 diff --git a/full_models/upv/config.json b/full_models/upv/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/upv/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/upv/vocab.txt b/full_models/upv/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..05b8ea6497a7f78f6c7791b88de952cdde86c85d --- /dev/null +++ b/full_models/upv/vocab.txt @@ -0,0 +1,31 @@ +ö +w +d +b +_ +p +l +r +' +2 +u +- +̃ +j +s +e + +o +g +v +6 +t +n +4 +a +0 +i +1 +m +k +5 diff --git a/full_models/ura/D_100000.pth b/full_models/ura/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..08c64acfa4c3043dca166a891803481d30966521 --- /dev/null +++ b/full_models/ura/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca18cf502275a6e62f65ba7dabd03748bee230d98515b0eda255d786593fd350 +size 561076179 diff --git a/full_models/ura/G_100000.pth b/full_models/ura/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fabcbef485e2d36087e09932162f14e1412ec8a9 --- /dev/null +++ b/full_models/ura/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540fb31d59854e1f85c4421cc7f2df5616d3323ac5d5e4cac0826fad07387046 +size 436332982 diff --git a/full_models/ura/config.json b/full_models/ura/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ura/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ura/vocab.txt b/full_models/ura/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ea2ecb6020c5c412e9d5e8be88a7de0982d61355 --- /dev/null +++ b/full_models/ura/vocab.txt @@ -0,0 +1,26 @@ +a +| +n +e +i +c +u +o +r +h +t +j +s +l +b +q +m +f +d +- +p +y +g +v +ñ + diff --git a/full_models/urb/D_100000.pth b/full_models/urb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3e60a6ea77d17b9abb055fde748b8da0fb8a669 --- /dev/null +++ b/full_models/urb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa06f961f4ba3b5ded2705586e8107ef50e595886f5688fdb33c30ee5a44af4 +size 561078242 diff --git a/full_models/urb/G_100000.pth b/full_models/urb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a54b7bcec8de2a2b127a79962e29f82259a2e36d --- /dev/null +++ b/full_models/urb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77c539a210f1a678964c8007802abc5e137224ff49e3cbc34c3d681ef9397846 +size 436393943 diff --git a/full_models/urb/config.json b/full_models/urb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urb/vocab.txt b/full_models/urb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..afb80d499cf75d57613246ca46ce7db1f39713bc --- /dev/null +++ b/full_models/urb/vocab.txt @@ -0,0 +1,45 @@ +— +w +b +x +é +5 +n +g +t +ỹ +e +ý +' +8 +4 +o +ã +_ +h +2 +7 +j +õ +r +i +u +ú +m + +9 +d +k +a +ó +á +3 +0 +p +1 +y +ĩ +ũ +ẽ +6 +s diff --git a/full_models/urd-script_arabic/D_100000.pth b/full_models/urd-script_arabic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5feb74118d78abd4650770c6657a7b7b3d74f99 --- /dev/null +++ b/full_models/urd-script_arabic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4598537ab63b2afc262631aa9b760f7c927a28aaf158a9711a150bcb8a4e9ffe +size 561110485 diff --git a/full_models/urd-script_arabic/G_100000.pth b/full_models/urd-script_arabic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e586536a304fa4c2a10e653de540d865a50dd961 --- /dev/null +++ b/full_models/urd-script_arabic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:622324e7300492c905e751e58e8090922aab8e33cc9a876f48c1e3fe2dd9acdf +size 436666452 diff --git a/full_models/urd-script_arabic/config.json b/full_models/urd-script_arabic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urd-script_arabic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urd-script_arabic/vocab.txt b/full_models/urd-script_arabic/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..f5179139fdcf90030409c2675f01e0c44b81eb3d --- /dev/null +++ b/full_models/urd-script_arabic/vocab.txt @@ -0,0 +1,58 @@ +د +خ +آ +ؤ +' +چ +ط +8 +5 +ن +و +ے +أ +ل +گ +ا +ث +ق +ی +ص +3 +ڑ +ر +9 +2 +ئ + +7 +ت +ف +_ +ب +ظ +— +ش +4 +1 +غ +ع +ٰ +م +ھ +ض +ژ +ز +ک +ٹ +ذ +0 +ج +ۂ +6 +پ +ہ +ح +ڈ +ں +س diff --git a/full_models/urd-script_devanagari/D_100000.pth b/full_models/urd-script_devanagari/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c15e11dbbed67bc8782d8cce5f044eeef40bfa55 --- /dev/null +++ b/full_models/urd-script_devanagari/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130a9b2123fa377a54c495f7fa4a92c5640b8ecd70fc580e3596ed55f94cb8cf +size 561078484 diff --git a/full_models/urd-script_devanagari/G_100000.pth b/full_models/urd-script_devanagari/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5c3942c8142984bef3b60124e4be200303c16d08 --- /dev/null +++ b/full_models/urd-script_devanagari/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a5e0f2e352f3b53368158117a90f262de49e1905069222d8c4fd00551e104b +size 436448004 diff --git a/full_models/urd-script_devanagari/config.json b/full_models/urd-script_devanagari/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urd-script_devanagari/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urd-script_devanagari/vocab.txt b/full_models/urd-script_devanagari/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e94190e2d98541a598512002c917701ec08a9ebe --- /dev/null +++ b/full_models/urd-script_devanagari/vocab.txt @@ -0,0 +1,68 @@ +| +ा +क +े +र +ह +न +स +म +ी +त +ि +़ +ल +् +ो +ं +द +ज +ब +ु +य +प +ै +ग +व +ू +उ +ख +अ +आ +ए +ँ +इ +फ +श +औ +च +ई +थ +भ +- +ड +ौ +छ +झ +ट +ठ +ऐ +ओ +घ +ध +ऊ +ढ +0 +' +2 +1 +4 +5 +— +9 +ः +3 +7 +8 +6 + diff --git a/full_models/urd-script_latin/D_100000.pth b/full_models/urd-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a936f5254e8ab947880ae2012785a838726f9e47 --- /dev/null +++ b/full_models/urd-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ec6979b6fad3d6233f5b70162ba89541a78ac8f469b3b88f9b0caea2cd0e58 +size 561078501 diff --git a/full_models/urd-script_latin/G_100000.pth b/full_models/urd-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..69f1462a5a4f0cf59f10c109e62b4a8c0a62012e --- /dev/null +++ b/full_models/urd-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a86eae6c850b637828edc71b68de3169e55891557ffe6a2fd38e60424062730 +size 436399270 diff --git a/full_models/urd-script_latin/config.json b/full_models/urd-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urd-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urd-script_latin/vocab.txt b/full_models/urd-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..076006f6a6f96cc0c8e6b6933631673ced5b1cf5 --- /dev/null +++ b/full_models/urd-script_latin/vocab.txt @@ -0,0 +1,47 @@ +| +a +h +ā +e +k +i +r +s +u +n +ī +m +t +ṅ +l +o +d +b +p +y +j +g +ū +w +z +c +q +ḳ +f +- +ṛ +ṭ +ġ +ḍ +' +0 +4 +2 +1 +5 +9 +3 +7 +8 +6 + diff --git a/full_models/urk/D_100000.pth b/full_models/urk/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67ae220be725a99b853408ce41a40982bf167f9f --- /dev/null +++ b/full_models/urk/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deeaffe1673e8923626d3b34ac29fc4432c6965e7b2be0d10ffe4a7f43a94126 +size 561078633 diff --git a/full_models/urk/G_100000.pth b/full_models/urk/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..002973219bd0c27ce9de6a8bdd5c100a6ab79ad3 --- /dev/null +++ b/full_models/urk/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b12012953e2cda656a6deb8c31c0afa7f3ebf1d0a52332dce195390a92b208 +size 436405933 diff --git a/full_models/urk/config.json b/full_models/urk/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urk/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urk/vocab.txt b/full_models/urk/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4c30ad38c7b5772beb43b330df6797bb64a30f35 --- /dev/null +++ b/full_models/urk/vocab.txt @@ -0,0 +1,50 @@ +| +า +อ +ู +ะ +ี +ก +ั +เ +น +ด +ื +ต +ฮ +ซ +บ +ล +ม +ร +ญ +จ +โ +ป +ย +ฆ +ฌ +ง +ว +ิ +- +แ +ํ +ค +' +ุ +ึ +ฟ +ท +พ +ช +3 +0 +4 +6 +1 +` +2 +q +t + diff --git a/full_models/urt/D_100000.pth b/full_models/urt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6844efe46abaeb6458d265856320fa45661b75cb --- /dev/null +++ b/full_models/urt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dabb4016769cfce135bb227a22fb777cd25bd330d929004823f7c7e5dbb0f067 +size 561078623 diff --git a/full_models/urt/G_100000.pth b/full_models/urt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7876f138a9e2a4456bfd57072ca01c96181a0a94 --- /dev/null +++ b/full_models/urt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2daae8a06e9fc6c24d28c7d7ad1dcdc3d45405ea07237278ae5520657f3e05e2 +size 436380590 diff --git a/full_models/urt/config.json b/full_models/urt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/urt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/urt/vocab.txt b/full_models/urt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e5c8bb565c2e37eacd02dfeb6be69a88db0807e0 --- /dev/null +++ b/full_models/urt/vocab.txt @@ -0,0 +1,39 @@ +4 +8 +' + +ŋ +e +m +6 +r +g +d +5 +y +n +v +2 +h +t +_ +9 +i +u +- +b +3 +o +1 +a +ꞌ +p +f +s +j +k +w +7 +c +0 +l diff --git a/full_models/ury/D_100000.pth b/full_models/ury/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f5d197df9b8bd4ffc344736dc2319b88131a6a34 --- /dev/null +++ b/full_models/ury/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e007e4a9d9095637ab914b9d40c1ee9e161863899c6bcc3de14b54d016f3c2b +size 561078216 diff --git a/full_models/ury/G_100000.pth b/full_models/ury/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cfbd15081c2c1b356c59ce303766b41dba79163f --- /dev/null +++ b/full_models/ury/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917a3ac07cd8282d7ab07b5e9104359caec5a94fc2fea50fe6084c7e068997c3 +size 436387394 diff --git a/full_models/ury/config.json b/full_models/ury/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ury/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ury/vocab.txt b/full_models/ury/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..218f708b18d24257c6ca9004b0febc9acf70715e --- /dev/null +++ b/full_models/ury/vocab.txt @@ -0,0 +1,42 @@ +- +8 +ï +9 +z +s +1 +d +ë +3 +w +b +– +r +o +i +l +' +u +6 +5 +n +h +y +m +a +ꞌ +0 + +g +f +k +2 +7 +t +e +— +4 +_ +c +p +j diff --git a/full_models/usp/D_100000.pth b/full_models/usp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f51543dc5e2758d19efba9ef3843b160953ad5ac --- /dev/null +++ b/full_models/usp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b68ce1e81b28e84376ca283c6a74eaea91826160ca770e4d739c590538bb339 +size 561078589 diff --git a/full_models/usp/G_100000.pth b/full_models/usp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..87c58775be2903a3c8b06c9f58ef2d1c6ecf815b --- /dev/null +++ b/full_models/usp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fdd25f805d52cbec81da7f50ac73b415801014327849c7fd1eaefed56b16c17 +size 436371234 diff --git a/full_models/usp/config.json b/full_models/usp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/usp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/usp/vocab.txt b/full_models/usp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1b8913191b13d5c1a4eb655c5909e0c54e366b70 --- /dev/null +++ b/full_models/usp/vocab.txt @@ -0,0 +1,35 @@ +| +a +i +j +' +k +c +t +r +l +n +e +o +h +s +u +w +b +m +x +y +p +d +z +q +ú +é +g +í +f +ó +v +á +ñ + diff --git a/full_models/uzb-script_cyrillic/D_100000.pth b/full_models/uzb-script_cyrillic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..831d961bdd22f9a6133407cd71bf3be296b64cc3 --- /dev/null +++ b/full_models/uzb-script_cyrillic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32f26d900e91955b7b39cc543400d66c8448dc27074f381388d264e8c164b16 +size 561078509 diff --git a/full_models/uzb-script_cyrillic/G_100000.pth b/full_models/uzb-script_cyrillic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8f81e8439935a6c22c7952d9ffff12eaf2fd4133 --- /dev/null +++ b/full_models/uzb-script_cyrillic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b38371e35610f97a92367162fb7d0b0b1b614ea3b896d3c56c8c6771513ed5d2 +size 436395019 diff --git a/full_models/uzb-script_cyrillic/config.json b/full_models/uzb-script_cyrillic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/uzb-script_cyrillic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/uzb-script_cyrillic/vocab.txt b/full_models/uzb-script_cyrillic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b7615016909b9cd783448b1027d16e92a1e155b2 --- /dev/null +++ b/full_models/uzb-script_cyrillic/vocab.txt @@ -0,0 +1,45 @@ +| +а +и +н +л +р +д +о +г +б +у +м +т +с +қ +к +з +ў +ш +е +й +ҳ +ч +х +в +э +ё +я +п +ғ +ж +ф +– +— +ю +ъ +0 +1 +2 +4 +6 +ь +3 +5 + diff --git a/full_models/vag/D_100000.pth b/full_models/vag/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..349eb5ba6457587235eebda7539c5356161762fb --- /dev/null +++ b/full_models/vag/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf8c1e07e08d07c4773f9eaff9f458d0bc3d744f444ff875c2bcceaf80452d6 +size 561078639 diff --git a/full_models/vag/G_100000.pth b/full_models/vag/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3da27017bbcce97c589e066f8ffda981a5e8a1c --- /dev/null +++ b/full_models/vag/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2723097cb43a4a7239c66463e0c189baced4f5ec02047813004ab619937c7256 +size 436387530 diff --git a/full_models/vag/config.json b/full_models/vag/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vag/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vag/vocab.txt b/full_models/vag/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..45d08f766e65428374e158c71dc6e0ba8a8b2e43 --- /dev/null +++ b/full_models/vag/vocab.txt @@ -0,0 +1,42 @@ +| +a +i +n +u +ɛ +ᴐ +l +r +b +d +ŋ +w +e +k +g +m +h +z +s +y +t +p +o +f +c +j +í +á +ú +v +à +ń +́ +ì +' +ɔ +é +ó +2 +3 + diff --git a/full_models/vid/D_100000.pth b/full_models/vid/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..872948b0593bd017be0b4a3a9361d8a056d970d2 --- /dev/null +++ b/full_models/vid/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2793df396e1d9560f4c8514c70332fb2e366cf8280168daac8af71ae86b06d8 +size 561079353 diff --git a/full_models/vid/G_100000.pth b/full_models/vid/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..487e16007c13c72490061c27ab2ea0e6d4aadb51 --- /dev/null +++ b/full_models/vid/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97179e6c06eea990ce3d159ef2391c4d61c9db45dfc28ebdec0a216898bcd146 +size 436357123 diff --git a/full_models/vid/config.json b/full_models/vid/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vid/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vid/vocab.txt b/full_models/vid/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fd101818347bb8666873bf7f767654197f6ac4f2 --- /dev/null +++ b/full_models/vid/vocab.txt @@ -0,0 +1,26 @@ + +m +z +e +_ +t +g +a +w +c +n +f +d +j +i +k +u +v +s +l +p +b +o +' +h +y diff --git a/full_models/vie/D_100000.pth b/full_models/vie/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..84d0178a395d748102e2e47110c1a7ceb59b42f4 --- /dev/null +++ b/full_models/vie/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4858021a9be6481af09bc118b95ed913933de5af5f8be7eccbfc55e7c51ec71 +size 561110394 diff --git a/full_models/vie/G_100000.pth b/full_models/vie/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..31b5cbb010446b07e4f008f96538e3bc7802db6b --- /dev/null +++ b/full_models/vie/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b2b87b80d276abe2ea83c60f7c1b57b7f76b113c8ef2724ca408a7efb93abe +size 436750766 diff --git a/full_models/vie/config.json b/full_models/vie/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vie/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vie/vocab.txt b/full_models/vie/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..d441eea3c45419425c6c4e3275b45f0e734be22e --- /dev/null +++ b/full_models/vie/vocab.txt @@ -0,0 +1,95 @@ +ụ +x +s +è +ì +ặ +ứ +ơ +u +ư +ằ +ỳ +â +c +v +ệ +ồ +_ +ỵ +ộ +ẻ +g +ạ +ĩ +ả +õ +ỡ +ẳ +ô +a +i +o +ừ +ỹ +ổ +à +ờ +ý +ù +– +ề +ễ +ẵ +ỏ +' +ò +ố +q +ọ +ẩ +ự +ã +2 +ị +e +đ +ó +ầ +é +ớ +ế +ủ +ử +d +ữ +ắ +ẽ +ẫ +m +ể +ũ +ỉ +ẹ +ỗ +í +y +ú +á +p +k +t +ấ +l +ở + +h +ỷ +ậ +b +ă +n +ê +r +ợ +- diff --git a/full_models/vif/D_100000.pth b/full_models/vif/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..52b45aef84d20ac51a1755f2e64c43e7d6542527 --- /dev/null +++ b/full_models/vif/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71809410f87943754e29d14a54e4eef03cfa8ea06591c2c1b88518f109db62ff +size 561078840 diff --git a/full_models/vif/G_100000.pth b/full_models/vif/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0905930e7150ef423382aac341075ee06a40b9f1 --- /dev/null +++ b/full_models/vif/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c12ea2c803b397bb7043a7482062f0c3ce53623e11d23faa704762e2d614f85d +size 436363270 diff --git a/full_models/vif/config.json b/full_models/vif/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vif/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vif/vocab.txt b/full_models/vif/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f6d7c85815e31c8ea0bafffbc8186854d1c4507a --- /dev/null +++ b/full_models/vif/vocab.txt @@ -0,0 +1,30 @@ +v +— +a +o +d +c +_ +b +- +g +‐ +n +k +e +p +t +f +i +ê +ë + +u +m +w +y +s +l +j +z +' diff --git a/full_models/vmw/D_100000.pth b/full_models/vmw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0b96a2f556837b8c18cb949cd905bf8819d73805 --- /dev/null +++ b/full_models/vmw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59508ea71caed12e3831bcfa365fe6e8b3e246274fdb8da2d21d3359e2701ca4 +size 561079239 diff --git a/full_models/vmw/G_100000.pth b/full_models/vmw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..96ab0f352ab82fd8d20d65acb4aee9dc41818fc6 --- /dev/null +++ b/full_models/vmw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3213b0c247a616479e229d6a09d45534084ec93aa6f30f3c7019bb74b033905f +size 436363477 diff --git a/full_models/vmw/config.json b/full_models/vmw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vmw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vmw/vocab.txt b/full_models/vmw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..13bb2eb02c5b3d8659a46a53c95168e0580e7f2a --- /dev/null +++ b/full_models/vmw/vocab.txt @@ -0,0 +1,29 @@ +t +f +h +c +x +- +m +i +' +b +u +e +r +d +k +y +w +p +l +g +n +s +v + +a +o +j +_ +2 diff --git a/full_models/vmy/D_100000.pth b/full_models/vmy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..05f86671ac2dc8581da6c20179ae30c41d955fb1 --- /dev/null +++ b/full_models/vmy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:139c2a424915e91752307f1d8de3d1979b7e6a89f37471ba6bce65553ceb9f1d +size 561078845 diff --git a/full_models/vmy/G_100000.pth b/full_models/vmy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c964fa19125299e7003cb32247788ebbf5eb0979 --- /dev/null +++ b/full_models/vmy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db56acee8b4043a7a0cc7a1ede1922c8e3270f046f82069611e54f7f2370607 +size 436375014 diff --git a/full_models/vmy/config.json b/full_models/vmy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vmy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vmy/vocab.txt b/full_models/vmy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bb543d8a2fd9b616d4dc947231d04fdeec1c2838 --- /dev/null +++ b/full_models/vmy/vocab.txt @@ -0,0 +1,35 @@ +l +x +i +í +u +b +k +é +v +ñ +n +q +r +f +c +o +e +p +t +m +_ +s +á +d +g +' +ó +a +z +h +ú + +̱ +j +y diff --git a/full_models/vun/D_100000.pth b/full_models/vun/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b74697cbea89efff7b56c71a1f39e852f9407c9d --- /dev/null +++ b/full_models/vun/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ebdabf860d1653db45b0e5893545533f32a7981c2a728781865eef1ab6f12d +size 561078702 diff --git a/full_models/vun/G_100000.pth b/full_models/vun/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..27a0077d42ba3dae43b9b411263bc73da419849e --- /dev/null +++ b/full_models/vun/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04af539329f6fff51fa46d233d917b4d4ba92609bcfb5e9603e27ded986e44ef +size 436361968 diff --git a/full_models/vun/config.json b/full_models/vun/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vun/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vun/vocab.txt b/full_models/vun/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..97a9411adc999c48f4478ec3be0296f7d4fe7eee --- /dev/null +++ b/full_models/vun/vocab.txt @@ -0,0 +1,30 @@ +| +a +i +y +n +o +u +k +e +w +m +l +s +h +g +d +r +ṙ +c +f +ṟ +t +p +b +- +' +j +z +v + diff --git a/full_models/vut/D_100000.pth b/full_models/vut/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c377e3d7cd2c318364e735f35b02ea8d70ba9264 --- /dev/null +++ b/full_models/vut/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862943fd62805a883eb6944530e3f15e50b84a5cb5d698f22671537c6a816f97 +size 561078837 diff --git a/full_models/vut/G_100000.pth b/full_models/vut/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2de22964bbcf98f98209e17762e7569147362a48 --- /dev/null +++ b/full_models/vut/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899384fd53c672c01e0733f69066d0562eb404826ac4edb495472e183060d42d +size 436411867 diff --git a/full_models/vut/config.json b/full_models/vut/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/vut/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/vut/vocab.txt b/full_models/vut/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f2c05c19e6796722dc266ae2641f9df4b8584dc3 --- /dev/null +++ b/full_models/vut/vocab.txt @@ -0,0 +1,51 @@ +w + +̧ +ȩ +́ +b +ê +ɨ +s +y +à +ô +ə +c +è +o +d +_ +ɗ +k +v +p +l +t +ɓ +é +á +̀ +m +g +ì +n +h +j +u +i +û +r +í +î +̂ +ó +a +ú +ò +ŋ +ù +ɔ +â +e +f diff --git a/full_models/wal-script_ethiopic/D_100000.pth b/full_models/wal-script_ethiopic/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ded77e618a4265068f2df74e2b78f6e91440c8d1 --- /dev/null +++ b/full_models/wal-script_ethiopic/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753ce02418a2e0778ff2af104febbffaea413547701015ac80820e36d589fe1b +size 561078222 diff --git a/full_models/wal-script_ethiopic/G_100000.pth b/full_models/wal-script_ethiopic/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d226c770354540aefb30794769704a6756348ec9 --- /dev/null +++ b/full_models/wal-script_ethiopic/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9aea9e079fe5aa847d3cf42c847b42309663be265b91c9227eb16d46134664d +size 436697702 diff --git a/full_models/wal-script_ethiopic/config.json b/full_models/wal-script_ethiopic/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wal-script_ethiopic/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wal-script_ethiopic/vocab.txt b/full_models/wal-script_ethiopic/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..79f8e3c6b98896bf7204c4d029d4cbc4a7ae81b9 --- /dev/null +++ b/full_models/wal-script_ethiopic/vocab.txt @@ -0,0 +1,178 @@ +| +ን +ስ +ይ +ነ +አ +ተ +እ +ት +ሰ +ያ +ደ +ዮ +ቴ +ድ +ግ +ኔ +ር +መ +ዶ +ዴ +በ +ኤ +ው +ጋ +ጌ +ከ +ዎ +ኦ +ረ +የ +ሀ +ታ +ኮ +ፔ +ኡ +ለ +ና +ዬ +ዋ +ሄ +ጦ +ሳ +ቀ +ሽ +ገ +ባ +ም +ጊ +ሱ +ሸ +ሶ +ል +ቶ +ቱ +ኑ +ቤ +ኣ +ክ +ኬ +ሮ +ዳ +ማ +ላ +ጎ +ቦ +ወ +ሁ +ሜ +ሴ +ሬ +ቆ +ብ +ቅ +ሃ +ጠ +ዘ +ሎ +ጥ +ቲ +ራ +ቃ +ሌ +ሞ +ጉ +ፕ +ፈ +ኪ +ቸ +ፐ +ቢ +ህ +ሙ +ዪ +ሲ +ጣ +ጤ +ዱ +ቄ +ሻ +ቁ +ኩ +ች +ሼ +ጴ +ሚ +ፖ +ኢ +ሉ +ጭ +ዽ +ጵ +ካ +ፑ +ፍ +ዝ +ጨ +ሹ +ጰ +ኖ +ዜ +ጫ +ዛ +ሩ +ሺ +ሾ +ዉ +ጬ +ሊ +ፌ +ፋ +ዞ +ሆ +ዲ +ቹ +ጡ +ቻ +ዙ +ዩ +ሪ +ፓ +ቾ +ፉ +ቂ +ቡ +ዌ +ቺ +ጄ +ቼ +ጩ +ኒ +ሂ +ጮ +ጢ +ፊ +ጪ +ዚ +ጶ +ዸ +ዺ +ጅ +ፎ +ጁ +ጀ +ዼ +ጱ +- +ፒ +ጆ +ጳ +ጃ +ጂ +ዾ +ጲ +ኙ +ዻ +ዹ + diff --git a/full_models/wal-script_latin/D_100000.pth b/full_models/wal-script_latin/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9c47f3acb9519eb2134d253d4961e284452c7d5 --- /dev/null +++ b/full_models/wal-script_latin/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6402a45f69fef696d93b389df5e38d5921f0035fd4ad82085ec975c3df35f34 +size 561078602 diff --git a/full_models/wal-script_latin/G_100000.pth b/full_models/wal-script_latin/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4358877e14caec7c6bf486800554905dc7065d8 --- /dev/null +++ b/full_models/wal-script_latin/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a585dea3c6bb0ee497fcea8606911ae3107a9c6d2fa3d4d74ad2747949dd041 +size 436359877 diff --git a/full_models/wal-script_latin/config.json b/full_models/wal-script_latin/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wal-script_latin/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wal-script_latin/vocab.txt b/full_models/wal-script_latin/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bb2e8cb07c55705d8ceef4582ec60b06615ba6f3 --- /dev/null +++ b/full_models/wal-script_latin/vocab.txt @@ -0,0 +1,30 @@ +a +| +i +e +s +o +n +t +d +y +h +u +g +k +b +m +r +p +l +w +q +x +7 +c +z +f +' +j +- + diff --git a/full_models/wap/D_100000.pth b/full_models/wap/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ffe5f4a796b179aa7b362eb679fd6ed62324e6df --- /dev/null +++ b/full_models/wap/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e256d5f6d0d15db558bfbc3005eec096442dfcb626bb901a097a23b8029047bd +size 561078635 diff --git a/full_models/wap/G_100000.pth b/full_models/wap/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..62c5f7d2943a3b493c16b187801bde046f60f667 --- /dev/null +++ b/full_models/wap/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b439b6296323e04a472c898e9094b44823c78a1fe445f67961811be369a407d +size 436389585 diff --git a/full_models/wap/config.json b/full_models/wap/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wap/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wap/vocab.txt b/full_models/wap/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..047da0a272176340a97376d1471b7bba5c707605 --- /dev/null +++ b/full_models/wap/vocab.txt @@ -0,0 +1,43 @@ +ã +z +p +m +3 +b +s +' +u +i +o +q +h +n +5 +õ +e +- +8 +a +y +0 +2 +l +7 +k +x +g +j +w + +r +c +t +f +d +9 +1 +4 +_ +6 +v +ĩ diff --git a/full_models/war/D_100000.pth b/full_models/war/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c6f7d4ec69fce5a177f42642a777862cc060c90 --- /dev/null +++ b/full_models/war/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b9a29602c2d9761372bedca030121426ef80a2304d964e5d68eb394779edf9 +size 561078708 diff --git a/full_models/war/G_100000.pth b/full_models/war/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..94d7e9b1db9b0711b93c24b3270118d85ca9d9f9 --- /dev/null +++ b/full_models/war/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1ab1673d52886bcb614940b9f9f86448768f8e46a426388bc0ab0cfb3d7cc4 +size 436387508 diff --git a/full_models/war/config.json b/full_models/war/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/war/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/war/vocab.txt b/full_models/war/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7be05258877a0e0594d1fd7d4719c56c1f161a57 --- /dev/null +++ b/full_models/war/vocab.txt @@ -0,0 +1,42 @@ +a +| +n +i +g +o +h +t +k +m +u +s +d +y +p +r +l +b +w +e +- +j +c +f +— +v +q +z +0 +4 +1 +2 +x +' +5 +3 +8 +9 +7 +ñ +6 + diff --git a/full_models/waw/D_100000.pth b/full_models/waw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..382a0c0ec0eb3c37853930edb4b67a561ffd10dc --- /dev/null +++ b/full_models/waw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ceb94c9e1283f63013fc85acac71f9abbadf82e8e26efe57f987af8fa67b1ce +size 561077737 diff --git a/full_models/waw/G_100000.pth b/full_models/waw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9f8ee128da532fcad52ef0f4f91f32d15618fdcf --- /dev/null +++ b/full_models/waw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6eef564ea7874986e2d2e0fbbbfde9c7d7ecf0c38c82d377c91f4c8604b4cf +size 436368599 diff --git a/full_models/waw/config.json b/full_models/waw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/waw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/waw/vocab.txt b/full_models/waw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..be0eccd57d39797093338674efdd59556e3305c6 --- /dev/null +++ b/full_models/waw/vocab.txt @@ -0,0 +1,34 @@ +| +a +o +e +k +n +r +m +t +î +w +h +y +̂ +p +i +s +x +c +u +b +0 +1 +2 +7 +4 +3 +5 +- +6 +8 +9 +d + diff --git a/full_models/way/D_100000.pth b/full_models/way/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e45368ab454c4fd8f467b31c9db6ad93c3af2cd --- /dev/null +++ b/full_models/way/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13cef65fb21205761b2c646be03ef3178e89159b59290f969d5e37b67d73c4d +size 561078974 diff --git a/full_models/way/G_100000.pth b/full_models/way/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ce873c2ab8981368fbbe9afa87bc2946eabc9447 --- /dev/null +++ b/full_models/way/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e46ac52fe8b220e52623e35dd0e0ca6fd6c7dbae19dadfc3ba4492a1c7f8a4b +size 436361925 diff --git a/full_models/way/config.json b/full_models/way/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/way/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/way/vocab.txt b/full_models/way/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..17b1773a06aba8fc8e1e640756270746f676e2b9 --- /dev/null +++ b/full_models/way/vocab.txt @@ -0,0 +1,29 @@ +| +a +ë +m +e +t +o +k +n +p +i +l +ï +h +u +w +j +s +0 +1 +2 +7 +4 +3 +5 +6 +9 +8 + diff --git a/full_models/wba/D_100000.pth b/full_models/wba/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..494af2495c9b35f2556b2f04fb598b84ff1a7b6e --- /dev/null +++ b/full_models/wba/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143292f98e7c5cf702b8351e41941cced9c4df8f059c5bd7481664a8fd6ebad5 +size 561078877 diff --git a/full_models/wba/G_100000.pth b/full_models/wba/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..38e57668a0e796dfc47297e135a4b5b2603372fe --- /dev/null +++ b/full_models/wba/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fed4ec36cee6dfdb6c77c68b590ee120504329d76aaad5109b03df949505a10 +size 436379008 diff --git a/full_models/wba/config.json b/full_models/wba/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wba/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wba/vocab.txt b/full_models/wba/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..17374005e4c2ab423ddf4268d695ba3860265199 --- /dev/null +++ b/full_models/wba/vocab.txt @@ -0,0 +1,37 @@ +e +n +m +x +q +i +á +í +é +k +o +g +y +r +z +ó +d + +_ +s +h +c +v +w +l +b +ã +a +u +f +ñ +t +p +õ +- +j +ú diff --git a/full_models/wlo/D_100000.pth b/full_models/wlo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..eb60f5e0b295e6d6de241e528d0f6beed8b34a66 --- /dev/null +++ b/full_models/wlo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd475c91ffc8988e171b0bfb11f25e29d69d22dc0421e330c308922605092db3 +size 561076071 diff --git a/full_models/wlo/G_100000.pth b/full_models/wlo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3e43de545b7721bbdd1cf4287e4c9ad6b50a031a --- /dev/null +++ b/full_models/wlo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19c7ad6cab6427433c545285a80dd63164eb15d3664045fe76fb96d64b53bea +size 436336435 diff --git a/full_models/wlo/config.json b/full_models/wlo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wlo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wlo/vocab.txt b/full_models/wlo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0deb9da065fd8d65d395315018f2496a352d2913 --- /dev/null +++ b/full_models/wlo/vocab.txt @@ -0,0 +1,28 @@ +c +a +h +j +k +o + +f +i +' +d +p +ʼ +l +_ +r +w +z +s +e +m +t +g +n +u +- +b +y diff --git a/full_models/wlx/D_100000.pth b/full_models/wlx/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d90471aa2dbc5b025265f0fa459d9f3c5fe2714a --- /dev/null +++ b/full_models/wlx/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0617065bb06e2d9dbdd257222afa0a32df276a163c09cf24bfa381374050de75 +size 561079378 diff --git a/full_models/wlx/G_100000.pth b/full_models/wlx/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..95339c03ac9f2bfcc40a092c6b7e366e4f815e13 --- /dev/null +++ b/full_models/wlx/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe8b989232b805d5f8aae6243fc9411668f5ce25d51661c7b9de56664bb2380 +size 436375244 diff --git a/full_models/wlx/config.json b/full_models/wlx/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wlx/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wlx/vocab.txt b/full_models/wlx/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5bab264e26567c4bef87d9d16fef829b90cb3d43 --- /dev/null +++ b/full_models/wlx/vocab.txt @@ -0,0 +1,34 @@ +o +9 +4 +w +h +k +m +q +5 +' +x +z +1 +_ +d +e +y +c +v +r +p +t +i +a +n +b +u +s + +j +g +f +- +l diff --git a/full_models/wmw/D_100000.pth b/full_models/wmw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bf42e37488cd6874e57ac7a9f8a429de64843dbe --- /dev/null +++ b/full_models/wmw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a207dac57c3152962e003b25c05b0917a610d88be74a67b5f6448eed7b87c8 +size 561078854 diff --git a/full_models/wmw/G_100000.pth b/full_models/wmw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..56f49aacc26d0b8d257953025305079ac364b9e7 --- /dev/null +++ b/full_models/wmw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6015d9792d9bb4490723601f056c941b526ad3cdef9f6e7bba03e661f800a7d9 +size 436389172 diff --git a/full_models/wmw/config.json b/full_models/wmw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wmw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wmw/vocab.txt b/full_models/wmw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..bc448a84f5c39dcccf2d0a53a93adf195e436aee --- /dev/null +++ b/full_models/wmw/vocab.txt @@ -0,0 +1,41 @@ +a +| +i +u +n +w +k +e +m +o +y +r +s +l +t +b +p +d +z +g +j +f +v +h +‐ +c +á +' +- +í +é +â +ú +ã +ó +î +û +ê +ô +ũ + diff --git a/full_models/wob/D_100000.pth b/full_models/wob/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66b42f6d4dae1719298a24f456bf9ef42cf386f3 --- /dev/null +++ b/full_models/wob/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b562d2c86cfd0088aea78f40fbf6103b4d744798eb689ea10e747200a85a9460 +size 561078838 diff --git a/full_models/wob/G_100000.pth b/full_models/wob/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ed60116708eb1b65b2261b6846342bd5c410b1b1 --- /dev/null +++ b/full_models/wob/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3607a5fb90ef89e5e4ea6f581d3a2d3da85c2bbc6be1742ab3c2b642538474 +size 436365303 diff --git a/full_models/wob/config.json b/full_models/wob/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wob/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wob/vocab.txt b/full_models/wob/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..62a8140527d5dbdaad7955b15dc3dd91cfa55dd4 --- /dev/null +++ b/full_models/wob/vocab.txt @@ -0,0 +1,31 @@ +| +' +a +‐ +e +n +ɛ +ʋ +i +ɔ +k +ɩ +o +d +s +m +w +j +u +t +p +b +l +y +r +c +g +f +- +v + diff --git a/full_models/wsg/D_100000.pth b/full_models/wsg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..35ebb12b6f1ec40c0b6464c37a3fe691f8549a7c --- /dev/null +++ b/full_models/wsg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e992475aef109913c449016d0ccfa6afcb36dcdd0686254e69e4d090b8b7a818 +size 561079242 diff --git a/full_models/wsg/G_100000.pth b/full_models/wsg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c9a359d6951830333fe08361ca935e0dda7de109 --- /dev/null +++ b/full_models/wsg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfe593edfd2f9abfcc8182df43d753f74dd217b70fcc50f480308f961799754 +size 436391740 diff --git a/full_models/wsg/config.json b/full_models/wsg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wsg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wsg/vocab.txt b/full_models/wsg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4aef659755273b8b17c3ba5fe839fbcd4c0f4722 --- /dev/null +++ b/full_models/wsg/vocab.txt @@ -0,0 +1,42 @@ +ల +చ +ద +ు +ా +ం +ప +ఆ +ఒ +ె +_ +k +అ + +ే +ఎ +య +ి +బ +ర +మ +వ +్ +క +ూ +ఈ +స +జ +ొ +ఊ +డ +ో +ీ +గ +హ +' +త +ఇ +న +- +ఉ +ట diff --git a/full_models/wwa/D_100000.pth b/full_models/wwa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..11cae93c6b7c4e78ac9c7afb7d7470ed9d071bdf --- /dev/null +++ b/full_models/wwa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48cb0d35b16b401672deb06facd9605412cea2100a3d0735e982606eb017369f +size 561078626 diff --git a/full_models/wwa/G_100000.pth b/full_models/wwa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c359621391f998236ff97cd7930b21bddd4e9b11 --- /dev/null +++ b/full_models/wwa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c31e74d407e1e5b343c1ce0e98a84f863880a854d9aad876e4c6279fec2645 +size 436373681 diff --git a/full_models/wwa/config.json b/full_models/wwa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/wwa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/wwa/vocab.txt b/full_models/wwa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e2fe1439a2212de873b78e10b9137bdbcc68e05b --- /dev/null +++ b/full_models/wwa/vocab.txt @@ -0,0 +1,36 @@ +| +a +i +n +t +d +o +m +b +r +e +s +u +y +k +ɛ +ɔ +à +w +p +ò +ŋ +ǹ +- +ì +f +c +̃ +ã +̀ +' +` +ĩ +ũ +2 + diff --git a/full_models/xal/D_100000.pth b/full_models/xal/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f838f0df1e3bb40d25851978af0e453ea9557509 --- /dev/null +++ b/full_models/xal/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:119bdb6a0b03a5a928cca835e06045447f8815d56bd7e848365a3c65d9d033ec +size 561079011 diff --git a/full_models/xal/G_100000.pth b/full_models/xal/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..165d3a2c5cb5feaa9dca74b0b5b92cd76c8edce0 --- /dev/null +++ b/full_models/xal/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8932949f3b5fc64ecdf3a5400de18431f08b7721eb57b0a2475bd276b44c69 +size 436406739 diff --git a/full_models/xal/config.json b/full_models/xal/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xal/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xal/vocab.txt b/full_models/xal/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..456063cd8741ef58913e70da1d2f5a68850b1c07 --- /dev/null +++ b/full_models/xal/vocab.txt @@ -0,0 +1,49 @@ +и +в +ю +ж +к +р +т +г + +ә +җ +д +_ +ч +п +х +ң +л +ө +ү +у +3 +ф +һ +о +б +ъ +0 +- +э +м +я +с +ё +а +е +й +з +1 +2 +– +6 +4 +н +ц +ѳ +ы +ш +ь diff --git a/full_models/xdy/D_100000.pth b/full_models/xdy/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b65c86269a797084d9d6829759d1cc459a0e512d --- /dev/null +++ b/full_models/xdy/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0529d0bad93456b97caad99537599fe2ee16289c9e00e4ff5412c296b6216f +size 561075951 diff --git a/full_models/xdy/G_100000.pth b/full_models/xdy/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1313de04911a906bbb32bccc6a4c1be7440b7a14 --- /dev/null +++ b/full_models/xdy/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf654f467b9f27bd37a46551efdc462996211439b1d175a79a3feff6bf0f66e +size 436333734 diff --git a/full_models/xdy/config.json b/full_models/xdy/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xdy/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xdy/vocab.txt b/full_models/xdy/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e59612c1e93e40606f7f1c034170d8400fb09bc1 --- /dev/null +++ b/full_models/xdy/vocab.txt @@ -0,0 +1,27 @@ +m +b + +u +r +t +l +g +j +e +p +d +k +h +w +o +' +- +f +z +_ +i +a +c +s +n +y diff --git a/full_models/xed/D_100000.pth b/full_models/xed/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83e7a98b94024302af4b8e38b04af809cef6e9cb --- /dev/null +++ b/full_models/xed/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7dbba84c18244b49e0c4b44a111fa056afcfca8d4577c123b7b26204642aa4 +size 561078997 diff --git a/full_models/xed/G_100000.pth b/full_models/xed/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..836aa5a93a87d4087c28b87c2f5b426df42c5949 --- /dev/null +++ b/full_models/xed/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0d6f1d346a2d53cb3eb7864160cab37fbda767fdc2387c3840a8f1167e2edf +size 436363097 diff --git a/full_models/xed/config.json b/full_models/xed/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xed/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xed/vocab.txt b/full_models/xed/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5d8f74a64d9d6177d047c7e256d6e2d720e78c4d --- /dev/null +++ b/full_models/xed/vocab.txt @@ -0,0 +1,30 @@ +ŋ +h +b +k +ɗ +á +ɓ +w +t +ə +g +í +_ +n +m +f +a +d +ʼ +r +l +u +s +e +z + +p +v +i +y diff --git a/full_models/xer/D_100000.pth b/full_models/xer/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8a1d2eea92a842c247cd7f9062f1830dde2188e3 --- /dev/null +++ b/full_models/xer/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c2c523bf2c16191e5190e1d031fb18f92e701931fa07937412335605eba74f +size 561076157 diff --git a/full_models/xer/G_100000.pth b/full_models/xer/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7331aec9463a29b196714c99d8cae85907a07f0e --- /dev/null +++ b/full_models/xer/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d883bc7de17f1eab88480af05dde87d6f271bc8fb8e3472a0a3505d369c6d96b +size 436396841 diff --git a/full_models/xer/config.json b/full_models/xer/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xer/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xer/vocab.txt b/full_models/xer/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..590c3cdfeb48c820bbd0db2fc93ed2a0f214b49d --- /dev/null +++ b/full_models/xer/vocab.txt @@ -0,0 +1,54 @@ +p +e +a +x +i +k +d +ó +2 +t +ô +ĩ +g +1 +c +ê +j +â +h +8 +l + +õ +n +ũ +é +ú +z +r +5 +w +v +u +í +0 +7 +9 +á +ẽ +ã +o +f +s +û +ø +b +- +3 +6 +q +_ +' +— +m diff --git a/full_models/xmm/D_100000.pth b/full_models/xmm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1c42938d5671b34e6f04829beda63c1acfda8e2d --- /dev/null +++ b/full_models/xmm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1a589a4fd79a83c16fb16b6c3f26113155c1426b1044007eaf8b1c44fe51c1 +size 561078612 diff --git a/full_models/xmm/G_100000.pth b/full_models/xmm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..34051f6e37b3673cf50b4e7dd32973026e828005 --- /dev/null +++ b/full_models/xmm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa292b0fb03ea3a799abfdd67a0bf363dfb55535c9a4421874cb032823773e2 +size 436366660 diff --git a/full_models/xmm/config.json b/full_models/xmm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xmm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xmm/vocab.txt b/full_models/xmm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f92e5cf195116803fd002a5c6efaf1582b36ba6b --- /dev/null +++ b/full_models/xmm/vocab.txt @@ -0,0 +1,33 @@ +2 +4 +' +r +c +l +s +0 +z +a +j +m +y +o +d +n +i +f +b +e +h +t +6 +g +3 +u +_ +p +k +1 + +w +- diff --git a/full_models/xnj/D_100000.pth b/full_models/xnj/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a0a558d80b55e800c9c298653cfe3cc357f7b4dd --- /dev/null +++ b/full_models/xnj/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6ee4f75404d4336c577f5c251ef6e1fa974b2c9ac42e37192f9f8dca77ddf3 +size 561079265 diff --git a/full_models/xnj/G_100000.pth b/full_models/xnj/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c792199246d4d05f8dc22ffd023a87ab9c6c98be --- /dev/null +++ b/full_models/xnj/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36173edfa0000bec9eccd84d31bb8bdf9156e651172a4ebd20545e8a5789fed4 +size 436356056 diff --git a/full_models/xnj/config.json b/full_models/xnj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xnj/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xnj/vocab.txt b/full_models/xnj/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a21f1b9d58f54dbe6adb62e5f3153aea2c2a6cb7 --- /dev/null +++ b/full_models/xnj/vocab.txt @@ -0,0 +1,26 @@ +n +_ +f +p +o +w +k +v +y +a +i +j +h +e +c +z +d +u +t +' +l +b +s +m +g + diff --git a/full_models/xnr/D_100000.pth b/full_models/xnr/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ed2064fd8a03384c8e1cb6d1b153f8e78d25022 --- /dev/null +++ b/full_models/xnr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d562ad3aaded2cee7bcd7885577f246aea8f9f0223f506bef8882d8bb00d5de +size 561078726 diff --git a/full_models/xnr/G_100000.pth b/full_models/xnr/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7e984b26df0286b0065176c4150bbc93ae40693 --- /dev/null +++ b/full_models/xnr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73f0acf3e7c76d21c698c4839d7da17205d7be331f4bda05cad2d95b842f8e6d +size 436432656 diff --git a/full_models/xnr/config.json b/full_models/xnr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xnr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xnr/vocab.txt b/full_models/xnr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d252a9264d5ffe068c1973eb6d0c10ee765d7efd --- /dev/null +++ b/full_models/xnr/vocab.txt @@ -0,0 +1,61 @@ +| +ा +े +् +ं +त +र +क +ह +ि +स +द +न +ी +ज +म +ल +य +प +ो +ु +ै +़ +ग +ण +ब +च +अ +आ +ई +ड +ऐ +ू +इ +ख +भ +थ +व +ए +श +ौ +ध +छ +फ +ठ +ट +झ +- +घ +ष +ऊ +उ +ओ +ढ +ँ +औ +ञ +ृ +' +— + diff --git a/full_models/xog/D_100000.pth b/full_models/xog/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..01d6fc4dd6663738e2de7343599a06a054491ceb --- /dev/null +++ b/full_models/xog/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52282c6ff966e72f41141f61fc6381713339cd01b0d6097d441223edd35afe6e +size 561078869 diff --git a/full_models/xog/G_100000.pth b/full_models/xog/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c3866eb9ff1a4c72bfc62fdccedd03982b491cb8 --- /dev/null +++ b/full_models/xog/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d572980559c655f81fa295d0333972cea90a14fe0521a7ee63f197ce4e2bd8 +size 436354183 diff --git a/full_models/xog/config.json b/full_models/xog/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xog/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xog/vocab.txt b/full_models/xog/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..08a77d56d5793cf11bbffb483e66249718f488cb --- /dev/null +++ b/full_models/xog/vocab.txt @@ -0,0 +1,26 @@ +y +a +m +s +f +k +h +o +_ +w +l +b +d +n +' +p +v +i +u +e +t +z +g + +j +r diff --git a/full_models/xon/D_100000.pth b/full_models/xon/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c55835cf213b1d227d9259c7852c71bba3be1280 --- /dev/null +++ b/full_models/xon/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06d4833aeff023a773f42bac8157b342e68b73a534ac032f73621509a030e07 +size 561078702 diff --git a/full_models/xon/G_100000.pth b/full_models/xon/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..01257f3822c66e81f1f2973bb405baaac8945a42 --- /dev/null +++ b/full_models/xon/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033422a10f7dedf8778fcda124a050b6358f08630f7c612fc508cd16c6fb139c +size 436357665 diff --git a/full_models/xon/config.json b/full_models/xon/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xon/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xon/vocab.txt b/full_models/xon/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..5a72f97fda13cb64a3828372c7deda532891f2f3 --- /dev/null +++ b/full_models/xon/vocab.txt @@ -0,0 +1,29 @@ +| +a +i +n +u +b +k +e +m +l +t +ɔ +p +o +r +y +w +s +h +g +d +ŋ +j +c +f +- +' +v + diff --git a/full_models/xrb/D_100000.pth b/full_models/xrb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4f36a9e5716e5e7b27213033e3eaaa847503700e --- /dev/null +++ b/full_models/xrb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ddaeaeee361f1dc3d42c882fa3cfe8eabde6bd2b1cf816421dac60b4638a3b +size 561078761 diff --git a/full_models/xrb/G_100000.pth b/full_models/xrb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9e31f6032c5067669f985f716d13db1e2ad8fd89 --- /dev/null +++ b/full_models/xrb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df42d97026bcc392cfa81a1ec9cf3f19f54e8e094a86b76922dd5d423a7e0466 +size 436370155 diff --git a/full_models/xrb/config.json b/full_models/xrb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xrb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xrb/vocab.txt b/full_models/xrb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..13dcc93afa12b73ea82541d88b9efdfb3624c78d --- /dev/null +++ b/full_models/xrb/vocab.txt @@ -0,0 +1,34 @@ +| +a +e +y +n +ã +i +o +w +k +u +p +m +h +l +s +t +r +g +ĩ +b +ɛ +ẽ +f +d +ŋ +- +c +ũ +ɔ +̃ +' +j + diff --git a/full_models/xsb/D_100000.pth b/full_models/xsb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c5c4cd9b8bdb34a044130531933744529bea9279 --- /dev/null +++ b/full_models/xsb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2159f613e2b9bca470062fd622adae06f2aad3f659915e64df447da11f50bdcc +size 561078763 diff --git a/full_models/xsb/G_100000.pth b/full_models/xsb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..596f5c8248357247e6ef8dbd9b3b794c68eb9ab9 --- /dev/null +++ b/full_models/xsb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d534e44c50b1d488939c62bd68cbfb72b5cb7ae089f3d3bb2845a1a66370611 +size 436389789 diff --git a/full_models/xsb/config.json b/full_models/xsb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xsb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xsb/vocab.txt b/full_models/xsb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d09eae7d6b83dc2045ad9188d159e01e967569f4 --- /dev/null +++ b/full_models/xsb/vocab.txt @@ -0,0 +1,42 @@ +f +t + +2 +0 +à +ô +c +p +z +b +u +ñ +g +' +y +s +4 +î +e +á +1 +w +q +_ +6 +x +d +r +h +j +k +m +n +a +i +o +ó +- +l +v +â diff --git a/full_models/xsm/D_100000.pth b/full_models/xsm/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d67d76daf8aaca0a7c6494f9bcca21ce217927de --- /dev/null +++ b/full_models/xsm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd503f7e6819f422305b208db6518ece1095212c147e6de4be1fe5234ea40401 +size 561077870 diff --git a/full_models/xsm/G_100000.pth b/full_models/xsm/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d243fcca9361e451443b999214bb590944db0e5 --- /dev/null +++ b/full_models/xsm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf2fcca6ab68b059d3bc05c86af5cbe19be3164789c5b6bc88a05617d52195f +size 436363937 diff --git a/full_models/xsm/config.json b/full_models/xsm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xsm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xsm/vocab.txt b/full_models/xsm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3285adcbc5cc11405920913701a4abf1a88047e9 --- /dev/null +++ b/full_models/xsm/vocab.txt @@ -0,0 +1,35 @@ +| +a +e +o +n +m +t +i +w +b +d +k +y +ɔ +r +l +g +s +ŋ +u +ɛ +- +p +á +j +z +h +c +é +ó +v +f +' +ǝ + diff --git a/full_models/xsr/D_100000.pth b/full_models/xsr/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b5ac35b605a544cc32ff8a5a82d46e57fce52217 --- /dev/null +++ b/full_models/xsr/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6350885e8254d1bc0bf61cbb9de910726cc0f71ebdda3637f062061cfe93b62f +size 561078614 diff --git a/full_models/xsr/G_100000.pth b/full_models/xsr/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..30215d4ffaf768c38d6015d4aedca8b922164989 --- /dev/null +++ b/full_models/xsr/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3891e09c68b6ceb091f6b9c5f8ba97be4c5e3d1e818ee0ca50dbfcdd0a4def4 +size 436422071 diff --git a/full_models/xsr/config.json b/full_models/xsr/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xsr/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xsr/vocab.txt b/full_models/xsr/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c5a605957951df68361e27af3280ca9fa71fddb4 --- /dev/null +++ b/full_models/xsr/vocab.txt @@ -0,0 +1,57 @@ +ठ +द +फ +ँ +ी +् +ओ +प +न +त +ट +श +ख +इ +ो +स +झ +ङ +ष + +ल +' +६ +भ +ौ +_ +ऊ +थ +उ +ड +क +ह +घ +ज +ै +ए +ू +छ +- +ि +व +ु +आ +ई +ा +ध +अ +ण +य +च +ग +ब +म +र +‍ +ं +े diff --git a/full_models/xsu/D_100000.pth b/full_models/xsu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..07dbd0d7a80d85ddbb98367da03f930fcd03af2b --- /dev/null +++ b/full_models/xsu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd0f2185aabe478d8063150b22f96f8df2cee5ac84797e9bd901f0fd1e7b1c67 +size 561076195 diff --git a/full_models/xsu/G_100000.pth b/full_models/xsu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..399229507180f3461d15bf39d49d3770c6157099 --- /dev/null +++ b/full_models/xsu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d16b4678727fd0aa0d55605484679e70b26faf313a2a7d9db43cff47f472b7 +size 436390364 diff --git a/full_models/xsu/config.json b/full_models/xsu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xsu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xsu/vocab.txt b/full_models/xsu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4b8a889d20557cef9535c64978dd54cb90f4c3e5 --- /dev/null +++ b/full_models/xsu/vocab.txt @@ -0,0 +1,51 @@ +| +a +ö +i +t +p +k +o +n +s +u +m +l +ĩ +e +h +ä +w +' +j +õ +ã +r +̃ +c +é +ẽ +d +0 +ó +b +á +v +ô +1 +í +7 +4 +2 +3 +ê +5 +f +ũ +g +ú +6 +8 +â +9 + diff --git a/full_models/xta/D_100000.pth b/full_models/xta/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1651724593364f921f2f367b29c6f751ae527ee9 --- /dev/null +++ b/full_models/xta/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522d565048ffe6db4de42dffb6d4e4997491422e2a7e07243971e4ce985ad6eb +size 561076032 diff --git a/full_models/xta/G_100000.pth b/full_models/xta/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..da3a16f15b1d406052d2d0382cb2fa42b648040b --- /dev/null +++ b/full_models/xta/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f245f9f3a253888aa308daec7e0619388ec6162f2a2881126dd81c6074288a +size 436368289 diff --git a/full_models/xta/config.json b/full_models/xta/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xta/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xta/vocab.txt b/full_models/xta/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f4599c0d0142a0ae7ff29c4a39fc7913170ec128 --- /dev/null +++ b/full_models/xta/vocab.txt @@ -0,0 +1,42 @@ +s +d +m +u +_ +g +ó +ä +l +é +k +z +á +n +x +h +p +f +o +y +i +ú +c +q +r +ö +̱ +ǔ +e +v +ü +ꞌ +í +j +t +ǎ +b +ë +ñ +ï + +a diff --git a/full_models/xtd/D_100000.pth b/full_models/xtd/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c9381ee9cb77c361c4d4c718e67b8bb2519e3e18 --- /dev/null +++ b/full_models/xtd/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f2a8cecd2d7fbd710fa0df7a7a5ffac008031d4981e70a64d7f1dc6efd2493 +size 561079130 diff --git a/full_models/xtd/G_100000.pth b/full_models/xtd/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..dbe0d3246bab0c25c3fa5d0db81b395928476518 --- /dev/null +++ b/full_models/xtd/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f65465f9fc0167e270c26f3b8ebe9c8a495d3e526f3b92ecacf72bee932a56 +size 436381882 diff --git a/full_models/xtd/config.json b/full_models/xtd/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xtd/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xtd/vocab.txt b/full_models/xtd/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c60843d140225735c3286ae22ecb9e73a71822e2 --- /dev/null +++ b/full_models/xtd/vocab.txt @@ -0,0 +1,39 @@ + +ʼ +i +k +x +ɨ +ñ +h +c +n +ó +— +d +u +í +' +m +‐ +z +v +ú +e +g +j +y +f +q +é +o +b +á +́ +t +p +a +r +l +s +_ diff --git a/full_models/xte/D_100000.pth b/full_models/xte/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0aa74fbe3adeca06a4835836fb6f1d3882f2a7c1 --- /dev/null +++ b/full_models/xte/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700849f4f9ed94c8a665ee57c84f4fbcf17f15459a8378b7f524672c7cf15f2f +size 561076184 diff --git a/full_models/xte/G_100000.pth b/full_models/xte/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a5167c0dd6c1c0f13f3eeab28f3baefb37a09b45 --- /dev/null +++ b/full_models/xte/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:593af0bc1b13c5af48a5282602651fc71699eb84ff31c98607879ad8738b3a36 +size 436355894 diff --git a/full_models/xte/config.json b/full_models/xte/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xte/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xte/vocab.txt b/full_models/xte/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..838f3a49cc24b61283eebc30c881e7b7feecb5a6 --- /dev/null +++ b/full_models/xte/vocab.txt @@ -0,0 +1,36 @@ +h +4 +w + +r +0 +m +j +z +9 +l +p +5 +y +2 +a +b +7 +s +- +d +1 +u +f +o +i +e +t +c +_ +k +8 +g +n +6 +3 diff --git a/full_models/xtm/D_100000.pth b/full_models/xtm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9b999d52291b5dfd998af3ac97f67a46edec9f02 --- /dev/null +++ b/full_models/xtm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8490e57f14fd7d0fdc28f0b62e65a07177f8fb359b177ca672f7b1c82f954e40 +size 561078632 diff --git a/full_models/xtm/G_100000.pth b/full_models/xtm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3c30a275102a99bf1144d384cafbde83f5355174 --- /dev/null +++ b/full_models/xtm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121004ec85f0ba3cf2eb1486a56a1ead5ac37d93c6e9abb1c8a614d044ae2cf5 +size 436385073 diff --git a/full_models/xtm/config.json b/full_models/xtm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xtm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xtm/vocab.txt b/full_models/xtm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ba8e584961943e0ae9cbf16300a13e537035522e --- /dev/null +++ b/full_models/xtm/vocab.txt @@ -0,0 +1,41 @@ +â +i +m +e +r +‍ +v +j +á +d +t +û +f +' +‐ +k +u +y +ú +é +o +l +í +h +ó +n +x +î +z +c +_ +ñ + +q +b +p +w +a +g +ê +s diff --git a/full_models/xtn/D_100000.pth b/full_models/xtn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8e25b52f9f5beaab5b0b8c7409ab4c9570be7c72 --- /dev/null +++ b/full_models/xtn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e57eebb862dbfa9c9edc02859dcc5cc3a999df4204cf47eeceee4eba2fab97a +size 561078961 diff --git a/full_models/xtn/G_100000.pth b/full_models/xtn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2f7d8289ebee139c778e6f37c8d1037376144396 --- /dev/null +++ b/full_models/xtn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185609602fa639f0d67c32e86db364403300dc19c4b0d2278464bf5cce2b077c +size 436374044 diff --git a/full_models/xtn/config.json b/full_models/xtn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xtn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xtn/vocab.txt b/full_models/xtn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ac532c8652b395369a3081988e531b4ea77ccc6e --- /dev/null +++ b/full_models/xtn/vocab.txt @@ -0,0 +1,35 @@ +i +͏ +n +u +p +t +k +á +l +o +r +h +q +x + +v +e +m +s +j +ꞌ +ñ +_ +g +í +c +y +z +ó +a +d +b +f +ú +é diff --git a/full_models/xua/D_100000.pth b/full_models/xua/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..02fc7ac13b5241f0c1d6f788d73f4933e616bff5 --- /dev/null +++ b/full_models/xua/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac93620339250e0b29bda53536bdfb1da2144bf284a8247cf3d49f3270cf420 +size 561076018 diff --git a/full_models/xua/G_100000.pth b/full_models/xua/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9bc9dc6608dd00cab1db8b245629915d44579dbd --- /dev/null +++ b/full_models/xua/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9489d0f2ee6b044bcc204f4e07df1376c28e1dd0ec7f3cf0afb71c1dbafc23ad +size 436377528 diff --git a/full_models/xua/config.json b/full_models/xua/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xua/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xua/vocab.txt b/full_models/xua/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc30ddaa4edf631cac04a82ebfc8bf18b3c2f670 --- /dev/null +++ b/full_models/xua/vocab.txt @@ -0,0 +1,46 @@ +ெ +ள +ூ +ஆ +ல +ஈ +இ +ற +ு +ச +ீ +ஓ +ை +ஹ + +அ +ம +ண +ா +உ +ஊ +ந +ே +- +_ +ஒ +த +ி +ழ +ஐ +் +ஞ +ன +ஸ +ப +ோ +வ +ட +ங +ஜ +ஏ +ொ +க +எ +ர +ய diff --git a/full_models/xuo/D_100000.pth b/full_models/xuo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..090bf7e74e9e20a3defc235dac6464ea1864043b --- /dev/null +++ b/full_models/xuo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183be65cba5bc94fce04f92a9bd4335d98d3f67a8d35f2a6fedf43c6d1a6f390 +size 561078742 diff --git a/full_models/xuo/G_100000.pth b/full_models/xuo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..48e179d6e1a393f5a760f359eead21eb1c7802c9 --- /dev/null +++ b/full_models/xuo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea0186715699c7fa00cca0e6962b752cdbb4ffc41eb86cc84437fed87c26bd6 +size 436410268 diff --git a/full_models/xuo/config.json b/full_models/xuo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/xuo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/xuo/vocab.txt b/full_models/xuo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..12566b2fe1c4668d176aac1609aa510214be7a38 --- /dev/null +++ b/full_models/xuo/vocab.txt @@ -0,0 +1,51 @@ +ě +_ +ḭ +é +̰ +k +ɓ +v +f +p +- +ù +e +ɗ +y +ú +à +n +ì +m +z +́ +b +d +ɔ +i +ǔ +ǐ +s +w + +ɛ +l +̌ +ǒ +h +o +t +í +á +r +' +ŋ +ṵ +u +ʼ +ó +g +ǎ +̀ +a diff --git a/full_models/yaa/D_100000.pth b/full_models/yaa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e87a6914862de6f7dcdbc2d3a6d671b320e4e6a6 --- /dev/null +++ b/full_models/yaa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0ab0c4eab60ea658c793ccde345441b5f6232b4ca44a38db4d4ff2d5c12ee4b +size 561078724 diff --git a/full_models/yaa/G_100000.pth b/full_models/yaa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b1021cd350d499f46971eb2c584e8f6426a7a283 --- /dev/null +++ b/full_models/yaa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2d961a8010f415dc67633c7e6fca0c4a9e8e7bee8bdab30e57591a100252f9 +size 436377176 diff --git a/full_models/yaa/config.json b/full_models/yaa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yaa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yaa/vocab.txt b/full_models/yaa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c786fcd842b80eb6b3fa3f0403b9f9e4e5481341 --- /dev/null +++ b/full_models/yaa/vocab.txt @@ -0,0 +1,37 @@ +a +| +i +o +k +n +f +s +e +m +ã +t +r +õ +x +p +h +y +ĩ +ẽ +c +j +ú +u +l +d +b +é +í +á +g +v +z +ó +q +ñ + diff --git a/full_models/yad/D_100000.pth b/full_models/yad/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..6c889127ee3672d57c5d56d19e0eb10aedd2ced0 --- /dev/null +++ b/full_models/yad/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d9ece7a288985e3a29ffa0aa154cbc7838ce7dadec54dc58c94115621a8bbb +size 561076154 diff --git a/full_models/yad/G_100000.pth b/full_models/yad/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4b27234fbdc84dd093e21e51c05535d008671f99 --- /dev/null +++ b/full_models/yad/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd71065da765a8cc2251b4c5744a298d1dffaf1e240e54c28e81fb94d8fb17fd +size 436341936 diff --git a/full_models/yad/config.json b/full_models/yad/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yad/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yad/vocab.txt b/full_models/yad/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..407296738da38a6c8d24fc8bf364d2ed4d2d5dbb --- /dev/null +++ b/full_models/yad/vocab.txt @@ -0,0 +1,30 @@ +a +| +i +y +̱ +u +r +j +t +n +d +s +v +e +m +c +h +o +ñ +b +p +q +ú +á +í +é +ó +l +g + diff --git a/full_models/yal/D_100000.pth b/full_models/yal/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..54b7f7bf4903f385b0b37f28f2a722d3062abd7b --- /dev/null +++ b/full_models/yal/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bae031f8f5f40b8b9a701a5d46bb8d45e428c13c2e263b96702d1d5112bd676 +size 561078847 diff --git a/full_models/yal/G_100000.pth b/full_models/yal/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..516746a2ed2be9f4eac38950704132320dc093f9 --- /dev/null +++ b/full_models/yal/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5851a8c4a6f3737229f965b69792dffd6739d40f210e0fbc3928de435cbd5b7 +size 436359200 diff --git a/full_models/yal/config.json b/full_models/yal/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yal/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yal/vocab.txt b/full_models/yal/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..476cdb9edd88fdea1825da012ce18b89f1c51ac9 --- /dev/null +++ b/full_models/yal/vocab.txt @@ -0,0 +1,29 @@ +| +a +n +i +e +x +y +m +ɛ +u +l +t +r +s +f +b +o +ɔ +d +k +g +ɲ +w +h +p +- +1 +c + diff --git a/full_models/yam/D_100000.pth b/full_models/yam/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f03c699b2634267e3269588db3e93453ec0d54b2 --- /dev/null +++ b/full_models/yam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ae37522ee5d41104737a2cd9f16749404a8040ea834152275bb3d0d8afd491 +size 561078726 diff --git a/full_models/yam/G_100000.pth b/full_models/yam/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..fdc02cbada5d0eddbfe58ed2e483ad3f33028ea5 --- /dev/null +++ b/full_models/yam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3a66d72429b05ac0bceac757428a788538157630b736c8e9c29b1e7b8f7f3a +size 436386250 diff --git a/full_models/yam/config.json b/full_models/yam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yam/vocab.txt b/full_models/yam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f56e08604838f14278b8380d8015dd08d59b1906 --- /dev/null +++ b/full_models/yam/vocab.txt @@ -0,0 +1,41 @@ +| +ə +n +s +̀ +a +ŋ +w +m +y +à +k +e +o +' +ʉ +b +i +g +è +d +t +ò +f +u +v +p +l +ì +c +ɛ +z +r +h +j +ù +ʼ +- +ˋ +̍ + diff --git a/full_models/yao/D_100000.pth b/full_models/yao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3d49d67030a61085123148c5401f2645a7f1f226 --- /dev/null +++ b/full_models/yao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944b7a8b47bb52b9a5cb015a717af7d599d8342382ce3b80fb480df1e13c6a7f +size 561078858 diff --git a/full_models/yao/G_100000.pth b/full_models/yao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..10b0ce55c973e1aa7ce5f586ce530d1a261bf78a --- /dev/null +++ b/full_models/yao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4199d0de9722a698d27a59fa61ed78bc7f3a78e808bb6a619fa44d8095eea3b7 +size 436358578 diff --git a/full_models/yao/config.json b/full_models/yao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yao/vocab.txt b/full_models/yao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..aa58fad3e269a6dc33a54d7232ed4d42e92b994e --- /dev/null +++ b/full_models/yao/vocab.txt @@ -0,0 +1,28 @@ +g +_ +b +c +n +s +ŵ +j + +v +m +k +r +z +' +d +a +e +t +u +y +f +l +i +w +p +h +o diff --git a/full_models/yas/D_100000.pth b/full_models/yas/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4528193c68c5ae85f6fe87f456722822d0614f10 --- /dev/null +++ b/full_models/yas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2274ce5fd8a66f5f127b888a1b2b7b69caca9c245569515f28876d5e72db27bf +size 561078861 diff --git a/full_models/yas/G_100000.pth b/full_models/yas/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ae01bcb5f9dfe464370ca3bb65b78750db2a769b --- /dev/null +++ b/full_models/yas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c41ea261751434610a0093e33898e5e7278f130b58ef349cd71468218a968d +size 436365833 diff --git a/full_models/yas/config.json b/full_models/yas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yas/vocab.txt b/full_models/yas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9d5311083a18d8d522d0ae7b60e5104bbf5ee1ef --- /dev/null +++ b/full_models/yas/vocab.txt @@ -0,0 +1,31 @@ +ɛ +́ +b +i +p +l +t +h +m +é + +g +k +d +í +_ +ú +o +c +ŋ +u +e +– +ó +f +a +s +y +á +ɔ +n diff --git a/full_models/yat/D_100000.pth b/full_models/yat/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2ef74eaeb9d44edc352feec868a3df77c9e96758 --- /dev/null +++ b/full_models/yat/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999d598ed8e0ed34a5bd210d7460c71107e3505dcfbd0a5cd57d817502d2ffae +size 561079264 diff --git a/full_models/yat/G_100000.pth b/full_models/yat/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..188f00966ff37de7219d2158988e04fe6ce5bdb9 --- /dev/null +++ b/full_models/yat/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24ee15f416eb116e2ba0563b0b8882682c67f7c3c8e5dc542e8f3eb20573b5b7 +size 436374971 diff --git a/full_models/yat/config.json b/full_models/yat/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yat/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yat/vocab.txt b/full_models/yat/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f1080b847a94ff6bd929fe9fad018698e9f01979 --- /dev/null +++ b/full_models/yat/vocab.txt @@ -0,0 +1,35 @@ +y +s +a +i +n +b +t +r +́ +l +_ +g +ɛ +d +ú +k +m +e +è +ɔ +c +á +u +f +ŋ +í +o + +p +ó +w +j +ʼ +ə +é diff --git a/full_models/yaz/D_100000.pth b/full_models/yaz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..67f00ba2c7902cd45aebe11c3464965f3c93301a --- /dev/null +++ b/full_models/yaz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bde19c1ac58e5bf6f2c1639747e28c79ef84688082c46706cd6940b46252438 +size 561078883 diff --git a/full_models/yaz/G_100000.pth b/full_models/yaz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4422ee7c31b0e1c97775d41b900c9477591aa35a --- /dev/null +++ b/full_models/yaz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7e84b8099d091849ec3162b32fca55b387a17a51c8c6dba61f231d021cd64b +size 436375766 diff --git a/full_models/yaz/config.json b/full_models/yaz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yaz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yaz/vocab.txt b/full_models/yaz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..448d06c102e2b21fb1ca98e663315f8d49e2b842 --- /dev/null +++ b/full_models/yaz/vocab.txt @@ -0,0 +1,35 @@ +h +ẹ +w +n +d +v +_ + +t +g +ọ +a +y +̀ +j +ì +l +à +z +i +- +ạ +' +ò +s +o +k +e +r +c +p +f +u +b +m diff --git a/full_models/yba/D_100000.pth b/full_models/yba/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d916d49b13b271b50676698f08f312e59387b3f0 --- /dev/null +++ b/full_models/yba/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d15f19d44b6043bafae0a6bcb16950ecd69fc3f5df549926245e95f718eabb +size 561078595 diff --git a/full_models/yba/G_100000.pth b/full_models/yba/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3e9cf453e4e9084bab1b9dd38adfb365ba6bd2ff --- /dev/null +++ b/full_models/yba/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc83c8a9bb879db7c36212f1ed1bcc28e9e23a84210d674fb3e3997c8436c170 +size 436373674 diff --git a/full_models/yba/config.json b/full_models/yba/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yba/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yba/vocab.txt b/full_models/yba/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a7306c19a499f7efec511583007e930057b0bd2f --- /dev/null +++ b/full_models/yba/vocab.txt @@ -0,0 +1,36 @@ + +ɛ +s +̄ +n +f +d +u +w +p +ā +m +b +_ +o +' +ɔ +r +j +l +a +ō +h +k +i +e +c +ū +ī +g +t +6 +- +y +ē +̍ diff --git a/full_models/ybb/D_100000.pth b/full_models/ybb/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..935d5217ac32b05467cc2ec85e3b8be7c6095401 --- /dev/null +++ b/full_models/ybb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46076f64ade759ce7a216753cd7cd3bb5748e65aad7ac7f66e24a33bd542546d +size 561078599 diff --git a/full_models/ybb/G_100000.pth b/full_models/ybb/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f4f6a356519873efd3c37e401bc21c382666d0d --- /dev/null +++ b/full_models/ybb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb069af5e0ebfd6e728918570bab76673aaf2e800a50da1f38a2c3fa2e90fa8 +size 436398672 diff --git a/full_models/ybb/config.json b/full_models/ybb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ybb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ybb/vocab.txt b/full_models/ybb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b261baa7202edfad6da4cf0ca18f7f1693b0d17a --- /dev/null +++ b/full_models/ybb/vocab.txt @@ -0,0 +1,46 @@ +| +e +ɔ +ŋ +ɛ +m +á +n +́ +a +t +p +é +ʼ +s +l +g +i +k +h +ʉ +w +z +̄ +y +í +d +u +ī +b +ú +ū +f +ā +j +o +ń +ē +ó +c +ō +ḿ +‐ +v +- + diff --git a/full_models/ycl/D_100000.pth b/full_models/ycl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4963a4700869eb59a9e670247e1979bfdcdaa18e --- /dev/null +++ b/full_models/ycl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2e0a67e4d874b886cfbe0682ce70b69df56fe17fa96a6dcb00f5e9244dc7427 +size 561079271 diff --git a/full_models/ycl/G_100000.pth b/full_models/ycl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7d8f0451e4c05ef7b3bb0559b276ee50fc2b2c4d --- /dev/null +++ b/full_models/ycl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf8247cc0c1596f8a0a9c5a5bf1898e6835a386c0b42379510c6f54110504d5 +size 436381982 diff --git a/full_models/ycl/config.json b/full_models/ycl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ycl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ycl/vocab.txt b/full_models/ycl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fec845e8fb45a3f6bfc6100d13de3e2e4a10390d --- /dev/null +++ b/full_models/ycl/vocab.txt @@ -0,0 +1,38 @@ +6 +h +0 +d +c +f +' +2 +v +i +o + +b +s +x +a +r +m +e +n +z +l +p +k +1 +- +3 +j +5 +g +t +y +q +_ +w +4 +9 +u diff --git a/full_models/ycn/D_100000.pth b/full_models/ycn/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83106514f1d5682f969169e78bb20ba85f0527c1 --- /dev/null +++ b/full_models/ycn/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206cbdf674cab1781c9376b29ae0c379e70e2ae4c3065b5d1d5c8bec05c5e7f2 +size 561076194 diff --git a/full_models/ycn/G_100000.pth b/full_models/ycn/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..d7db9f4e6e29eddadd2d10a5b5cbc9a264029bec --- /dev/null +++ b/full_models/ycn/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7054143cd51340a8a143fb1de059c3edee1eba0469e042c680a3741cf45bbeb5 +size 436367322 diff --git a/full_models/ycn/config.json b/full_models/ycn/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ycn/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ycn/vocab.txt b/full_models/ycn/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ec384c21e90f094c65d5d450550a5a2869910be --- /dev/null +++ b/full_models/ycn/vocab.txt @@ -0,0 +1,41 @@ +a +| +k +i +e +j +n +' +á +r +u +p +l +o +m +w +t +h +é +c +y +ú +ñ +ó +í +s +d +— +b +f +g +z +v +q +x +0 +- +4 +6 +1 + diff --git a/full_models/yea/D_100000.pth b/full_models/yea/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..62cd080f46c744e439e78ac53ea49952449f3bb4 --- /dev/null +++ b/full_models/yea/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4cd9a4019226e3972cb2a47822587f65665828890d8f5d11f239a86d7b1543 +size 561078612 diff --git a/full_models/yea/G_100000.pth b/full_models/yea/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..317ef9b1f7883db4eaa4f823caa6afc98ba08d2c --- /dev/null +++ b/full_models/yea/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78cb7d43098267a6531071a855a1527d060b0583c22acc427134d5e24acb6ce5 +size 436398887 diff --git a/full_models/yea/config.json b/full_models/yea/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yea/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yea/vocab.txt b/full_models/yea/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3c29a10def9b097e5346575e7045c204c29ac230 --- /dev/null +++ b/full_models/yea/vocab.txt @@ -0,0 +1,47 @@ +ഓ +ാ +മ +ഞ +യ +ണ +അ +വ +ല +ഊ +ഉ +് +ക +േ +ഇ +െ +ട +ആ +ത +ര +ജ +ൊ +ഒ +ന +ഗ +ൂ +ദ +ബ +ു +ഈ +പ +ങ +‍ +ോ +ഏ +ീ +' +ച +ി +എ +— +ള +ഡ + +റ +ൺ +_ diff --git a/full_models/yka/D_100000.pth b/full_models/yka/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..30bba925f0fd737ffdb74f137df96e9533643a05 --- /dev/null +++ b/full_models/yka/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2807592aa66e55640115be193e06a00e647d862a2d0a90af265a79992204a8d +size 561078838 diff --git a/full_models/yka/G_100000.pth b/full_models/yka/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2b11db63c0c6b41ad6101be34dea63ca672bd1d4 --- /dev/null +++ b/full_models/yka/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05abe3e6d5530c2935777b1e9af7801a5e4a086070b7a3556aec40701431dc8a +size 436366066 diff --git a/full_models/yka/config.json b/full_models/yka/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yka/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yka/vocab.txt b/full_models/yka/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..7da36d826d8309bdc24a523461ad454adc21464b --- /dev/null +++ b/full_models/yka/vocab.txt @@ -0,0 +1,32 @@ +ō +c +n +w +i +s +t +ꞌ +h +k +j +ī +ū +r + +- +a +p +ē +ã +' +u +o +e +y +l +m +g +d +b +_ +ā diff --git a/full_models/yli/D_100000.pth b/full_models/yli/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bcab46e7cd7306d31248b46bef19779c0dd9654e --- /dev/null +++ b/full_models/yli/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79f698220314d6f7e20e3ff58e88a290bca7ba0245a353f45351969f6a5d655 +size 561078713 diff --git a/full_models/yli/G_100000.pth b/full_models/yli/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f517e4a94dd8128d4ea2c1d02d3adb2c0e5ab389 --- /dev/null +++ b/full_models/yli/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f67db6328adfdff2469b341503d0e86a6fe986096b6c6ff558f63ceb51feab2 +size 436352942 diff --git a/full_models/yli/config.json b/full_models/yli/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yli/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yli/vocab.txt b/full_models/yli/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..70e02360ba773621436c670b4cf9de617910ec65 --- /dev/null +++ b/full_models/yli/vocab.txt @@ -0,0 +1,27 @@ +| +a +n +e +i +u +o +h +g +l +m +t +r +k +s +w +p +b +f +y +d +- +' +z +j +c + diff --git a/full_models/yor/D_100000.pth b/full_models/yor/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a4d78eddc18e0db21485c3fe7d2c77d9b353b2f --- /dev/null +++ b/full_models/yor/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83968d8f97a16940ded68694ca69480bd30e787b9e5fd2d53f81889af1ddf054 +size 561079264 diff --git a/full_models/yor/G_100000.pth b/full_models/yor/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4f61410dbbc2bf78f8db1556f5da5f36b60eec4 --- /dev/null +++ b/full_models/yor/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2752787a4274049a9e3e07f6a704071c60cbf60673828f540604d8fc16daf296 +size 436394053 diff --git a/full_models/yor/config.json b/full_models/yor/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yor/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yor/vocab.txt b/full_models/yor/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..b3960d6d89df52efdac53b186d1f6378452a52d8 --- /dev/null +++ b/full_models/yor/vocab.txt @@ -0,0 +1,43 @@ +| +n +í +ọ +i +à +ẹ +t +a +r +b +ì +w +́ +l +̀ +k +á +s +ú +o +g +m +y +ó +p +u +e +j +ò +f +ṣ +é +d +è +ù +ń +h +- +ǹ +— +' + diff --git a/full_models/yre/D_100000.pth b/full_models/yre/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e038b02d031fe6ad8e4f809ad706cf56d60a5a3 --- /dev/null +++ b/full_models/yre/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6933adabcaa354a0920b5b797679cd19d475919eec16593e6b29aea07d3a37 +size 561078865 diff --git a/full_models/yre/G_100000.pth b/full_models/yre/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ea22b8fe637f0733172d40a20b2bc5af37fe9da7 --- /dev/null +++ b/full_models/yre/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee0a0d7b83fa592891b3eff9f4bf5fe720705d054a1b281081d8281f3b30450 +size 436367716 diff --git a/full_models/yre/config.json b/full_models/yre/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yre/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yre/vocab.txt b/full_models/yre/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cde515cdd2ea3bae45c280ebe850c27fcb4d0c07 --- /dev/null +++ b/full_models/yre/vocab.txt @@ -0,0 +1,32 @@ +s +_ +y +j +z +n +ɛ +f +a +c +r +v +' + +m +d +ɔ +t +h +p +o +ɩ +- +e +g +u +k +ʋ +l +w +i +b diff --git a/full_models/yua/D_100000.pth b/full_models/yua/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3f936c9cfe8c67658f83a4a9ed7f3224f0039b67 --- /dev/null +++ b/full_models/yua/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:147644c5b1298d1a15fae5cfa959ed19c698fc6301b7b7131428943a117492b1 +size 561078591 diff --git a/full_models/yua/G_100000.pth b/full_models/yua/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2be13a32834e8f8797b8d984e029ac8fe18f3ac9 --- /dev/null +++ b/full_models/yua/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d788f08b2a2046a7a8d5445ab5c7428c56bf3e013368a3b2c66ff1f7bb4b4a +size 436371260 diff --git a/full_models/yua/config.json b/full_models/yua/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yua/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yua/vocab.txt b/full_models/yua/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..48e000172125dc558f1bce7b462f57e5ef52e929 --- /dev/null +++ b/full_models/yua/vocab.txt @@ -0,0 +1,35 @@ +| +a +' +e +l +u +o +t +i +c +n +b +j +m +y +x +á +k +s +h +é +p +z +q +d +w +ú +ó +í +r +g +f +v +ñ + diff --git a/full_models/yuz/D_100000.pth b/full_models/yuz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..f4492e733d7e8492dccba4bf5a03997c01e48545 --- /dev/null +++ b/full_models/yuz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50596af6c659070b42d9fcce9ee67604580188cece0a3270b6db68f0127333fe +size 561078629 diff --git a/full_models/yuz/G_100000.pth b/full_models/yuz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..62f3ee6e43f5f0cfee347e495dc972e0ed9e36b4 --- /dev/null +++ b/full_models/yuz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1205ccad907ccb1ffa45a257dab785d0588605a7e23621ea47a15636a98262dc +size 436406347 diff --git a/full_models/yuz/config.json b/full_models/yuz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yuz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yuz/vocab.txt b/full_models/yuz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..245da674032fbf52c20671c3a2245383cd3658c6 --- /dev/null +++ b/full_models/yuz/vocab.txt @@ -0,0 +1,49 @@ +á +ä +í +l +u +' +h +2 +t +r +6 +i +e +ó +é +9 +‐ +b +n +a +ë +k +j +ñ +v +z +- +s +y +c +d +3 +o +x +q +f +1 +5 + +m +0 +_ +8 +4 +ü +ú +g +p +7 diff --git a/full_models/yva/D_100000.pth b/full_models/yva/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cda15adaf97c6112475201c1e8bb16e0eb0a9a8d --- /dev/null +++ b/full_models/yva/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4ace143fd6b946d0a7e76250134dedca8f6a621bd1dc8b24e944ed35881680 +size 561078633 diff --git a/full_models/yva/G_100000.pth b/full_models/yva/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..84c31844362fd9f1effe085b192a295d7a9681f9 --- /dev/null +++ b/full_models/yva/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71512e9930b8f22ffa7370407170f4eaefd9da1c13276613ef57efc767105c1 +size 436355147 diff --git a/full_models/yva/config.json b/full_models/yva/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/yva/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/yva/vocab.txt b/full_models/yva/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..31e463b5457d763e408cfbc39443e34b855f474c --- /dev/null +++ b/full_models/yva/vocab.txt @@ -0,0 +1,28 @@ +a +| +n +o +e +i +m +r +u +t +s +y +w +v +p +k +b +j +d +g +l +h +' +z +- +f +c + diff --git a/full_models/zaa/D_100000.pth b/full_models/zaa/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..a73510fee9df9e74e91b04cb8e26f9be487ad59c --- /dev/null +++ b/full_models/zaa/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b30d0b31359429b01d55a7abd09a5e6d1f3602655f191426f05df41fa264cb0d +size 561076570 diff --git a/full_models/zaa/G_100000.pth b/full_models/zaa/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c97475a42e03414aff3b2b26f0ce220581061388 --- /dev/null +++ b/full_models/zaa/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057b92603697aaf684a8a087deb5d7b4bbe71f09b309d3fc7ce8dc3951db718a +size 436401205 diff --git a/full_models/zaa/config.json b/full_models/zaa/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zaa/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zaa/vocab.txt b/full_models/zaa/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9ac8cd8f87dd4753f6a3df4bb1526a333ee8af0b --- /dev/null +++ b/full_models/zaa/vocab.txt @@ -0,0 +1,48 @@ +| +a +n +i +u +' +e +t +l +c +r +s +b +o +d +q +p +á +ą +h +g +í +y +à +m +é +ì +è +ỹ +į +ú +ù +j +x +f +ó +v +́ +z +ñ +ò +̀ +k +ü +̨ +ı +ẗ + diff --git a/full_models/zab/D_100000.pth b/full_models/zab/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..cacd2c46f826ff24bfe2eb99e318a9c52f002ad5 --- /dev/null +++ b/full_models/zab/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72eb82727248c6308c2f0a7a8601e9209e4487851ed1e5872d7ed3d0307d7bb +size 561078834 diff --git a/full_models/zab/G_100000.pth b/full_models/zab/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..93d925617c9c292ce8ebdf7a0ca73c7eff0e9953 --- /dev/null +++ b/full_models/zab/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50924124a0fdda39451127c010bf7ea60910344d1ec4f9621b80830f1f80f615 +size 436378336 diff --git a/full_models/zab/config.json b/full_models/zab/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zab/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zab/vocab.txt b/full_models/zab/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..efcd938069197b9deb87edac2cc0b67c9d65b0c7 --- /dev/null +++ b/full_models/zab/vocab.txt @@ -0,0 +1,37 @@ +u +f +d +r +e +x +ó +v +j +ü +k +t +— +q +ú +l +z +á +m +n +_ + +é +ɨ +h +i +g +́ +s +y +b +ñ +í +o +p +a +c diff --git a/full_models/zac/D_100000.pth b/full_models/zac/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bcdb10096000ad947fa04ef8f6f3e084a973035f --- /dev/null +++ b/full_models/zac/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a44030174c0515790aa865c22392a7e196d5855cccf2e53cd239ec8ff8c5597 +size 561076145 diff --git a/full_models/zac/G_100000.pth b/full_models/zac/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c28b6d792913a0e8b1d343ed45f9aa923892a093 --- /dev/null +++ b/full_models/zac/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f288bdd62c0f58d69f8fc7fec23ab3ff5a9a4744f977746b4d79253e61c0ae +size 436354618 diff --git a/full_models/zac/config.json b/full_models/zac/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zac/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zac/vocab.txt b/full_models/zac/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dd5b4814dffb4bb44f67ad5c8dfcdb73276b9b17 --- /dev/null +++ b/full_models/zac/vocab.txt @@ -0,0 +1,36 @@ +á +f +_ +́ +q +u +ú +í +k +c +ü +j +e +y +a +s +p +i +o +d +é +z +v +ñ +b +ʼ +m +t +l + +r +h +g +ó +n +ë diff --git a/full_models/zad/D_100000.pth b/full_models/zad/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c6c5e670367eb9bfa33b31986f37ba0ae3ee2919 --- /dev/null +++ b/full_models/zad/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f5d48ec00968032d61a56dd9168ca320e3c8ac938cf9cc650e3250f8798dbb +size 561078623 diff --git a/full_models/zad/G_100000.pth b/full_models/zad/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..84ddafce1e4bdce32ea29e2f7a2b3dfe11b22c10 --- /dev/null +++ b/full_models/zad/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36deecedab99e5bc56e1ab0de53ffdbbc6ce9d5fc6ba8a956018b2d1c03ba9b2 +size 436382812 diff --git a/full_models/zad/config.json b/full_models/zad/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zad/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zad/vocab.txt b/full_models/zad/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..b126e914c7103e02b58bd8f4c3ab9456ae3c58df --- /dev/null +++ b/full_models/zad/vocab.txt @@ -0,0 +1,40 @@ +| +a +ꞌ +e +n +i +l +o +h +k +c +b +g +d +z +s +y +w +ṉ +t +ḻ +̱ +j +x +r +p +m +í +u +ə +ú +- +á +é +ó +f +v +q +ñ + diff --git a/full_models/zae/D_100000.pth b/full_models/zae/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e349447e716e64d250515f9342822c459aff152c --- /dev/null +++ b/full_models/zae/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9f65c5c6f1007c323c0afd8e16e4cee66e0c92d15092a2b68ac2a7fb60ab76 +size 561078596 diff --git a/full_models/zae/G_100000.pth b/full_models/zae/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..403eae063ac7b6e9e0213a8918de053d79b5c2b9 --- /dev/null +++ b/full_models/zae/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf022cb0d9888a8e59fc4f2f59bcbf7fbeaa9b7325bc2ea0091469d9fe55ca8 +size 436375973 diff --git a/full_models/zae/config.json b/full_models/zae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zae/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zae/vocab.txt b/full_models/zae/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..d9240b6e2993576af49871bf217c697c4de194c2 --- /dev/null +++ b/full_models/zae/vocab.txt @@ -0,0 +1,37 @@ +| +a +n +e +i +t +u +l +b +k +h +r +s +g +d +o +' +x +y +á +í +c +‐ +w +ú +m +p +j +é +f +ó +v +z +q +ñ +- + diff --git a/full_models/zai/D_100000.pth b/full_models/zai/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..54b82054c05cfc8499fb73aa5eca63a778054ecd --- /dev/null +++ b/full_models/zai/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0863e4922ac290503ba62178bee56f8b140caf5cd953220906c1a441256b985 +size 561078883 diff --git a/full_models/zai/G_100000.pth b/full_models/zai/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b814cf1d76e7da64d96a90d0791e5347e96491bc --- /dev/null +++ b/full_models/zai/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a6f8dc239c06f4475513fdb8b8b356bc629a8afec267ae3e3a4b579d607ae9 +size 436377747 diff --git a/full_models/zai/config.json b/full_models/zai/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zai/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zai/vocab.txt b/full_models/zai/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1c8f61e4af99d276ffbf186f00b994fbb3c595cb --- /dev/null +++ b/full_models/zai/vocab.txt @@ -0,0 +1,37 @@ +| +a +i +u +n +e +c +d +r +b +l +t +s +x +g +' +o +p +h +q +z +á +é +y +m +í +ñ +j +ú +ó +— +f +v +ü +k +- + diff --git a/full_models/zam/D_100000.pth b/full_models/zam/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f29573987a73e3be684766c892439a25d581926 --- /dev/null +++ b/full_models/zam/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7637b7899cbb7494b3273aa2422114f911d1bd54a0946fee40a51a92f42ea52b +size 561076065 diff --git a/full_models/zam/G_100000.pth b/full_models/zam/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..19d1ba726728ccebdc456f429dffc10dbe59a8bf --- /dev/null +++ b/full_models/zam/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5e4707b3f1018587a28ce13c7f6a63d08edbab079f86647cc6a1a5a4d7db69 +size 436366519 diff --git a/full_models/zam/config.json b/full_models/zam/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zam/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zam/vocab.txt b/full_models/zam/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..1d4e4975f62e5ebc954db455dddf072427d0b73b --- /dev/null +++ b/full_models/zam/vocab.txt @@ -0,0 +1,41 @@ +| +n +o +e +ꞌ +a +l +c +i +d +u +t +m +s +x +g +b +r +y +h +è +p +z +' +q +à +ó +j +ú +ì +ò +á +ñ +é +f +ù +í +v +ü +k + diff --git a/full_models/zao/D_100000.pth b/full_models/zao/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa91d170e541c55f64412101ab45c71305ae4372 --- /dev/null +++ b/full_models/zao/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02f6360876175f777ff2166e1d497cd35400e14c7adfbfe7743c49c665bd7e0 +size 561078889 diff --git a/full_models/zao/G_100000.pth b/full_models/zao/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5e946cfc68c18b60c4698718dda3d86013511ef5 --- /dev/null +++ b/full_models/zao/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:145c244dbd08aa4b74876e7d7a3797ea72e40c1249b9cc551e8180090070dcbc +size 436372734 diff --git a/full_models/zao/config.json b/full_models/zao/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zao/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zao/vocab.txt b/full_models/zao/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..57910a8f87717919c0556fdd81d3192663edc48e --- /dev/null +++ b/full_models/zao/vocab.txt @@ -0,0 +1,35 @@ +o +t +e +j +_ +b +á +x +k +g +y +q +i +l +m +v + +u +s +n +w +a +é +ú +z +r +í +f +ʼ +p +ó +d +h +c +- diff --git a/full_models/zaq/D_100000.pth b/full_models/zaq/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..324b744756a176b33bb5f3ea24694858d6debc1b --- /dev/null +++ b/full_models/zaq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf2741a469f35401a1c1558349d76cd72f1e1ac119ceab6f76864caf1f9d9a8 +size 561078840 diff --git a/full_models/zaq/G_100000.pth b/full_models/zaq/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a419a75f623851d179651898ce3806a175cd0f8 --- /dev/null +++ b/full_models/zaq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e3f5ac23463e872e15439716e96edbfe96676e6806714b6c76ca2f184f6837 +size 436399781 diff --git a/full_models/zaq/config.json b/full_models/zaq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zaq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zaq/vocab.txt b/full_models/zaq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..c84c1aa26723d6e85ed3cf8e71e74837c97777c0 --- /dev/null +++ b/full_models/zaq/vocab.txt @@ -0,0 +1,47 @@ +| +a +n +i +e +u +t +l +b +c +s +h +r +g +d +o +y +ꞌ +x +á +q +í +̱ +‐ +ú +m +p +j +ä +ü +- +é +f +ó +v +z +k +β +' +ο +ñ +ε +5 +ι +1 +8 + diff --git a/full_models/zar/D_100000.pth b/full_models/zar/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..530f57c5e1df96757765b708f83d3d7024ccf430 --- /dev/null +++ b/full_models/zar/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa427278c04a446ad8af8b4a056df2c184b8328d731b86b509e808e967725c1 +size 561079148 diff --git a/full_models/zar/G_100000.pth b/full_models/zar/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..9eec81900111978f00cc29b51bd72e351f26c0cf --- /dev/null +++ b/full_models/zar/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854995b730646a5bdc4c74baa2edbbd3fa634fe7879951a28ceb8d455a7cf1a8 +size 436386450 diff --git a/full_models/zar/config.json b/full_models/zar/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zar/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zar/vocab.txt b/full_models/zar/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0aec0684dfb82d5068de94b1f08415c2c174e822 --- /dev/null +++ b/full_models/zar/vocab.txt @@ -0,0 +1,40 @@ +g +t + +z +á +ö +ú +q +o +ž +é +ë +i +d +j +p +h +ü +x +l +ʼ +- +e +n +ǘ +ñ +ó +f +_ +í +a +m +v +́ +b +c +s +y +u +r diff --git a/full_models/zas/D_100000.pth b/full_models/zas/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3d42c4eae796f1991896dc09baf9713c2d41904f --- /dev/null +++ b/full_models/zas/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08cdb8222d6e071738e326b524c0c922f5ef1b10a29f1b3db6eab2e0d535e1b +size 561078585 diff --git a/full_models/zas/G_100000.pth b/full_models/zas/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8723aabb30ad9f9213dbb7c84c36ed6d00e5f7fe --- /dev/null +++ b/full_models/zas/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3fac067d775b400c72aaae11a0d5ecf5039bda21a3596c91e1d0647af9e1ac +size 436378295 diff --git a/full_models/zas/config.json b/full_models/zas/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zas/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zas/vocab.txt b/full_models/zas/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..eec44bec15fd5cb497406995feacc9768d8734c7 --- /dev/null +++ b/full_models/zas/vocab.txt @@ -0,0 +1,38 @@ +| +a +i +n +e +r +d +l +b +j +g +u +o +x +c +m +t +s +ë +z +' +y +p +h +ü +é +w +̱ +q +ú +á +v +f +ó +í +k +ñ + diff --git a/full_models/zav/D_100000.pth b/full_models/zav/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c65ff09fe7b14c89b4456b921de4aa6b6e2f0a65 --- /dev/null +++ b/full_models/zav/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa281264b8dae907619f5568d70ea3a6991e2efc35791e6b989641425b2302c +size 561076189 diff --git a/full_models/zav/G_100000.pth b/full_models/zav/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ae763883c13c58c156e9bbe59e203209352913a5 --- /dev/null +++ b/full_models/zav/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c598668b3733fe23564ff592f552248b64b540002cd75d5f0acac6c90c5874ad +size 436362587 diff --git a/full_models/zav/config.json b/full_models/zav/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zav/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zav/vocab.txt b/full_models/zav/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..69669397316eb5657416df54c09a568b34611af5 --- /dev/null +++ b/full_models/zav/vocab.txt @@ -0,0 +1,39 @@ +̱ +š +e +p +ɟ +f +h +i +ḻ +j +z +x +d +m +y +o +ɉ +ə +ṉ +ü +k +g + +c +ž +_ +ñ +q +a +' +l +u +— +r +t +n +w +b +s diff --git a/full_models/zaw/D_100000.pth b/full_models/zaw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..17e117460e3b96db12fb4d14794aeadbe40ec6b7 --- /dev/null +++ b/full_models/zaw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4c032a101a3886c9ff08b650c8450b4a00065536a7b9e6647e99ca505cd25b +size 561078701 diff --git a/full_models/zaw/G_100000.pth b/full_models/zaw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..aa3ba25e619ec3237a2e8e0c81ff410829483246 --- /dev/null +++ b/full_models/zaw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6178c5692568dad041e2e0e3a372537805c4c3f4fb0f55cb91dc3440e41afa0b +size 436391847 diff --git a/full_models/zaw/config.json b/full_models/zaw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zaw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zaw/vocab.txt b/full_models/zaw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ea38978d500d93a1e49a0979a9d6badc36b9b5b8 --- /dev/null +++ b/full_models/zaw/vocab.txt @@ -0,0 +1,44 @@ +| +i +a +n +e +u +j +r +c +d +l +s +x +t +g +o +b +ä +ꞌ +h +z +ṉ +p +ḻ +y +m +ú +w +q +é +f +- +ṟ +í +̲ +ó +́ +á +v +' +k +ñ +ü + diff --git a/full_models/zca/D_100000.pth b/full_models/zca/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..7a6a5a5f8ff9e21e60db94e0cfe0787263fdff3e --- /dev/null +++ b/full_models/zca/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c73d9f712cb491dece5eb4b727ea14602ecbb17b5c35901aee8f21f983ad88 +size 561076192 diff --git a/full_models/zca/G_100000.pth b/full_models/zca/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2e0f0d5ae19629dbb4600dbc1b89548605e8f659 --- /dev/null +++ b/full_models/zca/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531826e273fb050c4f3b7f2951a5eaa7a7d4663c8362b88dd76853b7a81f35b2 +size 436365223 diff --git a/full_models/zca/config.json b/full_models/zca/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zca/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zca/vocab.txt b/full_models/zca/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..e904d26e59c6c0e7cd6fdab29ce21d3f85f6d010 --- /dev/null +++ b/full_models/zca/vocab.txt @@ -0,0 +1,40 @@ +| +a +n +ꞌ +i +o +e +l +r +k +z +h +m +x +b +s +u +g +t +d +ë +p +w +y +c +j +ú +ñ +á +é +f +ó +í +v +̱ +q +- +— +' + diff --git a/full_models/zga/D_100000.pth b/full_models/zga/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4e31d6422bbe331cf76224c36b3dbf0f0a10e4e1 --- /dev/null +++ b/full_models/zga/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db90481ef1395895ddcf70f44aeaa3021d06fca66e52ed565d8c3b82cf3e5df3 +size 561078983 diff --git a/full_models/zga/G_100000.pth b/full_models/zga/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..74e4599edea18fc40a6c568321e3e254176ebe01 --- /dev/null +++ b/full_models/zga/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057078637e093a1cfcbd3aa9f2d9242c5d97e0d14781f59383477d43ac7c97d2 +size 436360341 diff --git a/full_models/zga/config.json b/full_models/zga/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zga/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zga/vocab.txt b/full_models/zga/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a3b1bb20d046af2b28c78750390eb62fd8cdd4ed --- /dev/null +++ b/full_models/zga/vocab.txt @@ -0,0 +1,29 @@ +g +u + +v +ʉ +p +k +f +m +_ +e +y +ʼ +s +a +z +j +n +d +- +o +l +w +t +i +ɨ +b +h +' diff --git a/full_models/zim/D_100000.pth b/full_models/zim/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..24d9d01fd8f5e2afb3dc0be86eb97f251bab33f4 --- /dev/null +++ b/full_models/zim/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29c98bae4a6d7f110d5c098690fa5d5f77667154bd35dd09d68810699197951 +size 561078851 diff --git a/full_models/zim/G_100000.pth b/full_models/zim/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..5406e644be2b9e3f67915e5a705f4b410876402a --- /dev/null +++ b/full_models/zim/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d547245d5c074a9c77a64b625fa545272911d01bc87669c3e7064e2e538f6fb2 +size 436390650 diff --git a/full_models/zim/config.json b/full_models/zim/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zim/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zim/vocab.txt b/full_models/zim/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..375cb2c58b1d102a722c623352df9305ef8b1b4c --- /dev/null +++ b/full_models/zim/vocab.txt @@ -0,0 +1,42 @@ +v +ï +k +ù +ʼ +û +a +c +l +w +g +t +z +h +m +s +' +j +á +u +n +p +f +ô +- + +â +î +_ +ú +r +i +o +d +y +b +à +ê +e +— +ˮ +é diff --git a/full_models/ziw/D_100000.pth b/full_models/ziw/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..092ac4db8802012920516e58d4d1bd055d355de7 --- /dev/null +++ b/full_models/ziw/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe297d3e5ec731910302c27819528b96161a64a5361c9ad5fba0f40d7a5f2e14 +size 561079104 diff --git a/full_models/ziw/G_100000.pth b/full_models/ziw/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ec3014ea2f805613ac1d13f27eefb42350a74c22 --- /dev/null +++ b/full_models/ziw/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b411ec63b093f6430041e3d60ccd3f593aab7f43bfb22b968e435153e512ded5 +size 436354321 diff --git a/full_models/ziw/config.json b/full_models/ziw/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ziw/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ziw/vocab.txt b/full_models/ziw/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..013c44bf3448611891a929859a703a89a82e2f69 --- /dev/null +++ b/full_models/ziw/vocab.txt @@ -0,0 +1,26 @@ +a +' +j +g +w +e +c +u + +t +_ +f +l +s +h +i +v +d +p +m +k +z +y +n +b +o diff --git a/full_models/zlm/D_100000.pth b/full_models/zlm/D_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5ecd6cbbfc4e6d525233626be9dcc18c27f4663 --- /dev/null +++ b/full_models/zlm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd772bc8002235ad832f63cec16c3b5a1faff11eef915d8ea50dbce2ae55e38 +size 561110657 diff --git a/full_models/zlm/G_100000.pth b/full_models/zlm/G_100000.pth new file mode 100644 index 0000000000000000000000000000000000000000..0ee18da5149a49c9b8f3e0760f9d6d7d5067755d --- /dev/null +++ b/full_models/zlm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7773897c01982b556cd4c0a4a911ccb41c386891d712b25f2e7536e3363aa5f2 +size 436609829 diff --git a/full_models/zlm/config.json b/full_models/zlm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zlm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zlm/vocab.txt b/full_models/zlm/vocab.txt new file mode 100644 index 0000000000000000000000000000000000000000..c5341cfc6ff6909a2ddd466155ceca187613838e --- /dev/null +++ b/full_models/zlm/vocab.txt @@ -0,0 +1,34 @@ +y +g + +f +e +t +o +5 +j +_ +3 +k +– +i +a +0 +n +6 +d +u +c +' +h +q +- +p +m +w +r +4 +s +l +b +z diff --git a/full_models/zmz/D_100000.pth b/full_models/zmz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e30e056d245e36d591d60c99c7757edfaa31e4bd --- /dev/null +++ b/full_models/zmz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c492635d4d9c00486de67e6b0f2b27c6c06826da4add95991dad3ead42021cb +size 561079021 diff --git a/full_models/zmz/G_100000.pth b/full_models/zmz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..da4bd54c0f6fdb710985a8c5670dd21ef992eeb5 --- /dev/null +++ b/full_models/zmz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:683f9a5d7689bf8fa640d24a48c6318739b5a8edb94a3582446afb3d9fb5926d +size 436427495 diff --git a/full_models/zmz/config.json b/full_models/zmz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zmz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zmz/vocab.txt b/full_models/zmz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f8b3728749a2c2d2beef3086ab16f87e4e66770a --- /dev/null +++ b/full_models/zmz/vocab.txt @@ -0,0 +1,58 @@ +ú +j +ã +ʉ +à +k +ẽ +1 +n +g +o +v +3 +u +2 +e +d +ɔ +ù +7 +ì +p +6 +ò +œ +4 +- +í +ũ +_ +l +́ +i +t +r + +ó +s +õ +9 +0 +é +' +a +z +5 +m +w +8 +y +̀ +b +ĩ +̃ +h +f +è +á diff --git a/full_models/zne/D_100000.pth b/full_models/zne/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2370cc0ff6a27244236e083193522ef022e3e04a --- /dev/null +++ b/full_models/zne/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c127688f93b1f7dd7bf54b4fbac5dafae1a83aba0be9132d129e217795325a +size 561079006 diff --git a/full_models/zne/G_100000.pth b/full_models/zne/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c159c905212f04fdcccfbb021822cfa87fab2b81 --- /dev/null +++ b/full_models/zne/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:709dc8bdcc9e28ca7eefc2d2dd7eb03da60e7f212780b6e0421b3cf37fb5ef8e +size 436380548 diff --git a/full_models/zne/config.json b/full_models/zne/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zne/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zne/vocab.txt b/full_models/zne/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..41b6c316fc14bf9dcb28149c3f66a40cf9898f48 --- /dev/null +++ b/full_models/zne/vocab.txt @@ -0,0 +1,38 @@ +û +ĩ +k +b +z +o +ò + +p +r +d +f +ã +m +ä +0 +i +t +ô +y +s +g +e +4 +v +ũ +2 +u +õ +a +ẽ +n +â +_ +h +w +- +ì diff --git a/full_models/zos/D_100000.pth b/full_models/zos/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..737e55896d3227327576c1c9be2422655aed6d37 --- /dev/null +++ b/full_models/zos/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea687823045af1810ab4ca28d7fde4d8e7e70e0d1e86334e40f4e38cf84c19ec +size 561078726 diff --git a/full_models/zos/G_100000.pth b/full_models/zos/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..57b3fa207620efd289ec973442c6404372cc479b --- /dev/null +++ b/full_models/zos/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f17872a24d8188873f5c7cae6c16b0bc46c8a86e48001b17eb2d06bddf1b6e6 +size 436380538 diff --git a/full_models/zos/config.json b/full_models/zos/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zos/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zos/vocab.txt b/full_models/zos/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..3f471cfb66dc5076bc9d1b85cec2271fceb2f35b --- /dev/null +++ b/full_models/zos/vocab.txt @@ -0,0 +1,38 @@ +u +m +é +x +s +f +y +n +t +q +á +c +ö +e +' +a +d +ó +p +o +í +ü +v +b +ø +r +ú +ñ +h +j +z +i +_ +g + +k +ṉ +l diff --git a/full_models/zpc/D_100000.pth b/full_models/zpc/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..61b3d51be92b091ff50e43897cfa053325d1d564 --- /dev/null +++ b/full_models/zpc/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e888ae54c622cd65dc61ec0cefd6945acf45939bf4065eb23876729e46988a5f +size 561078881 diff --git a/full_models/zpc/G_100000.pth b/full_models/zpc/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0d33e34e9820ea0b77ad61865853591f12981aeb --- /dev/null +++ b/full_models/zpc/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e03d7788e048e1fe78e77034e2d87d40510bb08eb824caee166ee335a716ba99 +size 436383735 diff --git a/full_models/zpc/config.json b/full_models/zpc/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpc/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpc/vocab.txt b/full_models/zpc/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..dae74619cb47fdf7c0242537db3558a8893ca3cd --- /dev/null +++ b/full_models/zpc/vocab.txt @@ -0,0 +1,39 @@ +n +y +r +ꞌ +c +s +p +t +u +l +o +k +m +v +̃ + +ó +ú +a +f +j +í +­ +x +á +q +_ +ë +b +g +é +ü +h +i +z +ñ +' +d +e diff --git a/full_models/zpg/D_100000.pth b/full_models/zpg/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b9b31e821e1037c67487562ae631de042c901ae0 --- /dev/null +++ b/full_models/zpg/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971598d8661310ecd53c1f23be64e7243deecb26bebd3b43087e4f6e29ca2cd8 +size 561079101 diff --git a/full_models/zpg/G_100000.pth b/full_models/zpg/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..8735a8ec144687b5ca19ba551c7fe8a00df6d8ab --- /dev/null +++ b/full_models/zpg/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c499159f20f8c7776213133548998530da744b66ff4da8df8ed083bd6945c8e +size 436401190 diff --git a/full_models/zpg/config.json b/full_models/zpg/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpg/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpg/vocab.txt b/full_models/zpg/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0979f8c4fdf420d72cce8d18419f36445693f038 --- /dev/null +++ b/full_models/zpg/vocab.txt @@ -0,0 +1,46 @@ +| +e +i +a +n +o +d +y +l +u +z +m +r +g +h +ñ +t +ꞌ +b +c +x +s +p +â +- +w +ü +q +î +ó +é +ḻ +j +‐ +ú +ṉ +í +ṟ +f +á +v +ê +ô +û +k + diff --git a/full_models/zpi/D_100000.pth b/full_models/zpi/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..2331091840253cedee32a53e6340f2eec3c45f76 --- /dev/null +++ b/full_models/zpi/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5695fb2aebcedfb264cf176759e5eb06730af35af69f5187984dc2bb4f7f3a +size 561078607 diff --git a/full_models/zpi/G_100000.pth b/full_models/zpi/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..05cb67b3dde94e5958834ae5d05727c22c6d43da --- /dev/null +++ b/full_models/zpi/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04aeb7bc2a5dc8ddd4843f21d78714eb391ad970d3f06c6660567f7947c457f7 +size 436376092 diff --git a/full_models/zpi/config.json b/full_models/zpi/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpi/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpi/vocab.txt b/full_models/zpi/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..fc6a49a0fe9857f6d0900b7395084c2916299cd2 --- /dev/null +++ b/full_models/zpi/vocab.txt @@ -0,0 +1,37 @@ +| +e +n +a +o +l +d +r +y +i +u +m +t +g +z +k +x +s +w +b +p +h +ë +c +é +j +- +f +á +í +ó +v +́ +q +ú +ñ + diff --git a/full_models/zpl/D_100000.pth b/full_models/zpl/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..e1fca631b7fa8b81b5ccc499ecaf957a3b0d404e --- /dev/null +++ b/full_models/zpl/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9772da0f8d2a159c37564785d286177042727df963e0329c1bb39bf6aba5ee03 +size 561078621 diff --git a/full_models/zpl/G_100000.pth b/full_models/zpl/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..83bb35c5a134216d8ecee90f047101574a768e99 --- /dev/null +++ b/full_models/zpl/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7e185051a4f1f8442ef3f48217fdd1dec6ab1c08e7b860908d9105ce552e40 +size 436371270 diff --git a/full_models/zpl/config.json b/full_models/zpl/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpl/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpl/vocab.txt b/full_models/zpl/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a3439fc65d1a887fdbb3278f8cbac447bc958500 --- /dev/null +++ b/full_models/zpl/vocab.txt @@ -0,0 +1,35 @@ +a +c +l +ñ +ü +i +r +ó +e +j +o +b +u +p +n +g +h +v +k +t +x +í +d +' +y +q +_ +é + +á +m +ú +z +s +f diff --git a/full_models/zpm/D_100000.pth b/full_models/zpm/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c01b421c82c19149bea194b80eb16893a902ff18 --- /dev/null +++ b/full_models/zpm/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:471125d642b99727a6b0f78e7fce81c165952cb10dea8b77a570d2f10b49aed5 +size 561078725 diff --git a/full_models/zpm/G_100000.pth b/full_models/zpm/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..c2ee42ffd889e9b12f8a582c29d845c2c2d247c2 --- /dev/null +++ b/full_models/zpm/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53dbc90bd0827c9d94c49630cea9909539e9fc4a7407b5a7447bb30380b361ad +size 436385088 diff --git a/full_models/zpm/config.json b/full_models/zpm/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpm/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpm/vocab.txt b/full_models/zpm/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..9801f43200634e9bf1e60534533bc620f4359222 --- /dev/null +++ b/full_models/zpm/vocab.txt @@ -0,0 +1,41 @@ +w +u +f +j +' +e +é +ü +_ +p +o +á +b +ó +m +t +ñ +k +l +‐ +v +q +n +ṉ +d +y +r +í +ḻ +x +ú +- +ë +i +s +h +a +g +z + +c diff --git a/full_models/zpo/D_100000.pth b/full_models/zpo/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..099ae86a58a8ea68badc8dde4963f17a8e9cc9f8 --- /dev/null +++ b/full_models/zpo/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abba19f308e45453515245528d4ab330afb781c681793cdcbd0f05072f489b76 +size 561079130 diff --git a/full_models/zpo/G_100000.pth b/full_models/zpo/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..3afbe7cfce9b6801c9f9db3879869fa8d640ec37 --- /dev/null +++ b/full_models/zpo/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fafb4836f36c205ea25f5efa46d3070ffac34dcde3c26c2fafabd3e756616f09 +size 436404023 diff --git a/full_models/zpo/config.json b/full_models/zpo/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpo/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpo/vocab.txt b/full_models/zpo/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..f65f11f4ed1a6154cfbcd18684d278a449170b20 --- /dev/null +++ b/full_models/zpo/vocab.txt @@ -0,0 +1,47 @@ +- + +_ +3 +c +t +n +i +a +ú +7 +q +é +8 +m +2 +á +9 +v +k +y +u +r +6 +e +l +' +x +j +ñ +f +h +b +s +í +ó +p +g +o +— +4 +w +z +1 +5 +0 +d diff --git a/full_models/zpt/D_100000.pth b/full_models/zpt/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b61180b1c51cace9a81fe3f31717b4d65ce96786 --- /dev/null +++ b/full_models/zpt/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73429fcb51cdfb7bf37c3da03a760aba256e81b0402f168f68c9ba8781dbaabd +size 561079134 diff --git a/full_models/zpt/G_100000.pth b/full_models/zpt/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..269ca07f580df6f0e0e40aa0b69c23f527cfe3f7 --- /dev/null +++ b/full_models/zpt/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8d1c0e6558938369fba10c8fb12fe823e2cc43784027a6c0e06a34573dbda66 +size 436381792 diff --git a/full_models/zpt/config.json b/full_models/zpt/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpt/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpt/vocab.txt b/full_models/zpt/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..380db342639a6bdbd8733796d6b14c6454140100 --- /dev/null +++ b/full_models/zpt/vocab.txt @@ -0,0 +1,38 @@ +ñ +c +k + +ó +ꞌ +u +w +ú +i +' +t +f +j +q +b +í +d +_ +r +y +e +á +n +h +m +l +‐ +a +o +p +v +s +g +z +— +é +x diff --git a/full_models/zpu/D_100000.pth b/full_models/zpu/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..ca438a7a1db828ee6e2085137be6cf5186367229 --- /dev/null +++ b/full_models/zpu/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2245d50315aa6c318aab169727ae1d266f08774db3715fff11d0bb5bdea01a2 +size 561078625 diff --git a/full_models/zpu/G_100000.pth b/full_models/zpu/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..70a3c7fc43294210d60a063dcd52c70cdd63807e --- /dev/null +++ b/full_models/zpu/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5a926f1564b44806f4f4a3bdf9dc0c4428cf34e04fe3760ba0739c4f390a4ee +size 436376011 diff --git a/full_models/zpu/config.json b/full_models/zpu/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpu/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpu/vocab.txt b/full_models/zpu/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..a19e3b62e5202b8fdb52ec90370b2148b322a0c3 --- /dev/null +++ b/full_models/zpu/vocab.txt @@ -0,0 +1,37 @@ +a +g +- +á +b +ñ +i +í +t + +f +' +l +— +d +z +p +s +j +ú +x +n +w +q +r +u +_ +v +é +h +e +k +o +c +m +ó +y diff --git a/full_models/zpz/D_100000.pth b/full_models/zpz/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..bae0553d80612d32f9205590216dbcb5ec25bda0 --- /dev/null +++ b/full_models/zpz/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f323c0db458e61870984eea69037ad9ff5e8018abec8432856d56fc6558e4b3 +size 561078718 diff --git a/full_models/zpz/G_100000.pth b/full_models/zpz/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..b07b0c1b0eeab3e3417165be05e97fa503fcc46f --- /dev/null +++ b/full_models/zpz/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27419cf9ad37042981622a59872f5f9266bfcd54d3852c5cd000f8a336414ab0 +size 436375978 diff --git a/full_models/zpz/config.json b/full_models/zpz/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zpz/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zpz/vocab.txt b/full_models/zpz/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..ef859c0afee46ee143674aa96a2904b892a7c9ad --- /dev/null +++ b/full_models/zpz/vocab.txt @@ -0,0 +1,37 @@ +ñ +z +s +é +e +g + +t +m +o +ü +r +j +q +k +a +i +' +b +c +̱ +l +_ +p +h +á +v +w +ú +y +ó +í +f +u +d +n +x diff --git a/full_models/ztq/D_100000.pth b/full_models/ztq/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..034d840781a91ab3087474ac093645df73818b1d --- /dev/null +++ b/full_models/ztq/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02a358995e0cdce52510f6f6307de8449ae9c45db2ff4dd269c0580f04efd605 +size 561079395 diff --git a/full_models/ztq/G_100000.pth b/full_models/ztq/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1478b67636dcb0030a1a05db21bf2855ae3591ad --- /dev/null +++ b/full_models/ztq/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bdeb67ba4bb953e91ca338e9c652b7b3354aec1b6e48ae40f368248369dd661 +size 436380705 diff --git a/full_models/ztq/config.json b/full_models/ztq/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/ztq/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/ztq/vocab.txt b/full_models/ztq/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..4c97efbb961d859c07e2dad71ecc8d555d8a487e --- /dev/null +++ b/full_models/ztq/vocab.txt @@ -0,0 +1,36 @@ +ó +ë +f +í +z +x +p + +ú +k +n +m +— +w +s +a +j +u +v +_ +e +g +d +t +ñ +o +q +l +y +r +b +á +é +c +i +h diff --git a/full_models/zty/D_100000.pth b/full_models/zty/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..4d89ad8715eb769e096342027a8f5cbb47c3b3fa --- /dev/null +++ b/full_models/zty/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e6fe30beca31355ac9e96b8eeee6934414e6b38428bb7f4072c3faa63ebad07 +size 561078626 diff --git a/full_models/zty/G_100000.pth b/full_models/zty/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..66de022f652630e68929ac95ab0094ef758eb480 --- /dev/null +++ b/full_models/zty/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a103ebf86642ed1ef0345bf8d9355e95bba6c5d5d7137c237fbbf1a566c6a7f +size 436380336 diff --git a/full_models/zty/config.json b/full_models/zty/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zty/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zty/vocab.txt b/full_models/zty/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..08872d2be1837caeba18d584cebc7af7f0a58401 --- /dev/null +++ b/full_models/zty/vocab.txt @@ -0,0 +1,39 @@ +í +̱ + +é +á +ẕ +ó +d +i +c +u +b +p +n +t +k +m +g +o +ḻ +l +r +- +_ +' +h +w +x +e +z +ž +j +ú +a +y +f +s +ñ +— diff --git a/full_models/zyb/D_100000.pth b/full_models/zyb/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..295e32d4d42b15f79b258b0dea5a9c076bf26a57 --- /dev/null +++ b/full_models/zyb/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9598e02d9667557198acbab8922c783ac9410b4ca19413965788fcac4daab272 +size 561078863 diff --git a/full_models/zyb/G_100000.pth b/full_models/zyb/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..399f2781123ec4eee41b8580a1ebec1254c33d9a --- /dev/null +++ b/full_models/zyb/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d119177bca119090d7931cd90e1cb5367cf747826b1c431567c50a17ea1eb0e +size 436364962 diff --git a/full_models/zyb/config.json b/full_models/zyb/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zyb/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zyb/vocab.txt b/full_models/zyb/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..994a74036a428e1f7461534c7b3206f827d26438 --- /dev/null +++ b/full_models/zyb/vocab.txt @@ -0,0 +1,31 @@ +| +n +e +a +g +i +h +u +o +j +d +z +q +w +m +c +b +s +y +x +l +v +r +f +k +t +' +p +— +- + diff --git a/full_models/zyp/D_100000.pth b/full_models/zyp/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..92be86306940ffcbd420817f84870f6a32cebb59 --- /dev/null +++ b/full_models/zyp/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17bc3794734181d32642a0b5bd92086122f84afb437f7526e1aa548eb883a2b3 +size 561078502 diff --git a/full_models/zyp/G_100000.pth b/full_models/zyp/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..efa16e730ddbbb9ca5cab2a0bfd1b167829e9457 --- /dev/null +++ b/full_models/zyp/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c64d8eb823754395165c436b3e2ad19ca49205d3e41b6c107cafb7844ffd6b +size 436384873 diff --git a/full_models/zyp/config.json b/full_models/zyp/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zyp/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zyp/vocab.txt b/full_models/zyp/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..cb3750662cc5f1dc4d75ace43243ba998b8af055 --- /dev/null +++ b/full_models/zyp/vocab.txt @@ -0,0 +1,41 @@ +| +a +h +n +i +t +e +g +w +c +l +k +u +p +o +s +m +r +y +z +b +v +d +á +j +f +- +0 +é +1 +2 +4 +í +5 +6 +ú +3 +7 +ó +' + diff --git a/full_models/zza/D_100000.pth b/full_models/zza/D_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..0c4f9404ed1aaee4f4639daf2ef9b90b15a62ffe --- /dev/null +++ b/full_models/zza/D_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5ab86bbd0b3fd15d9d9a8dd29f0a2bc6fb9983f0fbf1b4d0dbe4538d0712169 +size 561076147 diff --git a/full_models/zza/G_100000.pth b/full_models/zza/G_100000.pth new file mode 100755 index 0000000000000000000000000000000000000000..1b581b50eeded7b1c0640b90b3959058c5fec57d --- /dev/null +++ b/full_models/zza/G_100000.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7338052d9d9208bfdca6d664269b3994b4b047c461f32ddfdb8974bc936693 +size 436352816 diff --git a/full_models/zza/config.json b/full_models/zza/config.json new file mode 100644 index 0000000000000000000000000000000000000000..183f6cf4aa2db779aed3ddadc188bbb02e860690 --- /dev/null +++ b/full_models/zza/config.json @@ -0,0 +1,87 @@ +{ + "train": { + "log_interval": 200, + "eval_interval": 1000, + "seed": 1234, + "epochs": 20000, + "learning_rate": 0.0002, + "betas": [ + 0.8, + 0.99 + ], + "eps": 1e-09, + "batch_size": 64, + "fp16_run": true, + "lr_decay": 0.999875, + "segment_size": 8192, + "init_lr_ratio": 1, + "warmup_epochs": 0, + "c_mel": 45, + "c_kl": 1.0 + }, + "data": { + "training_files": "train.ltr", + "validation_files": "dev.ltr", + "text_cleaners": [ + "transliteration_cleaners" + ], + "max_wav_value": 32768.0, + "sampling_rate": 16000, + "filter_length": 1024, + "hop_length": 256, + "win_length": 1024, + "n_mel_channels": 80, + "mel_fmin": 0.0, + "mel_fmax": null, + "add_blank": true, + "n_speakers": 0, + "cleaned_text": true + }, + "model": { + "inter_channels": 192, + "hidden_channels": 192, + "filter_channels": 768, + "n_heads": 2, + "n_layers": 6, + "kernel_size": 3, + "p_dropout": 0.1, + "resblock": "1", + "resblock_kernel_sizes": [ + 3, + 7, + 11 + ], + "resblock_dilation_sizes": [ + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ], + [ + 1, + 3, + 5 + ] + ], + "upsample_rates": [ + 8, + 8, + 2, + 2 + ], + "upsample_initial_channel": 512, + "upsample_kernel_sizes": [ + 16, + 16, + 4, + 4 + ], + "n_layers_q": 3, + "use_spectral_norm": false + } +} \ No newline at end of file diff --git a/full_models/zza/vocab.txt b/full_models/zza/vocab.txt new file mode 100755 index 0000000000000000000000000000000000000000..0fde70484b16f7364d5272cbdaa7b7d603382565 --- /dev/null +++ b/full_models/zza/vocab.txt @@ -0,0 +1,35 @@ +| +a +e +n +i +r +ê +î +y +o +d +m +k +w +b +t +s +h +l +ş +z +v +x +j +u +q +g +p +c +ç +û +f +' +- +