End of training

Browse files

Files changed (8) hide show

README.md +118 -0
config.json +275 -0
generation_config.json +15 -0
model.safetensors +3 -0
predictions_common_voice_13_en_common_voice_13_en_test_wer19.47.csv +0 -0
predictions_common_voice_13_en_common_voice_13_en_test_wer19.47_hyp.trn +0 -0
predictions_common_voice_13_en_common_voice_13_en_test_wer19.47_ref.trn +0 -0
training_args.bin +3 -0

README.md ADDED Viewed

	@@ -0,0 +1,118 @@

+---
+tags:
+- generated_from_trainer
+datasets:
+- common_voice_13_0
+metrics:
+- wer
+model-index:
+- name: DeCRED_small_cv_2
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# DeCRED_small_cv_2
+This model is a fine-tuned version of an unspecified base model (the Trainer did not record one) on the common_voice_13_0 dataset.
+It achieves the following results on the evaluation set:
+- Loss: 1.0669
+- Cer: 0.0663
+- Wer: 0.1563
+- Mer: 0.1532
+- Wil: 0.2546
+- Wip: 0.7454
+- Hits: 128002
+- Substitutions: 17367
+- Deletions: 2812
+- Insertions: 2975
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.002
+- train_batch_size: 128
+- eval_batch_size: 64
+- seed: 42
+- distributed_type: multi-GPU
+- num_devices: 2
+- total_train_batch_size: 256
+- total_eval_batch_size: 128
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- lr_scheduler_warmup_steps: 10000
+- num_epochs: 50.0
+### Training results
+| Training Loss | Epoch | Step   | Cer    | Deletions | Hits   | Insertions | Validation Loss | Mer    | Substitutions | Wer    | Wil    | Wip    |
+|:-------------:|:-----:|:------:|:------:|:---------:|:------:|:----------:|:---------------:|:------:|:-------------:|:------:|:------:|:------:|
+| 1.6144        | 5.0   | 14885  | 0.1526 | 5701      | 107636 | 6856       | 1.4427          | 0.3057 | 34844         | 0.3199 | 0.4765 | 0.5235 |
+| 1.5552        | 6.0   | 17862  | 0.1438 | 5401      | 109845 | 6588       | 1.3968          | 0.2903 | 32935         | 0.3032 | 0.4549 | 0.5451 |
+| 1.5102        | 7.0   | 20839  | 0.1327 | 5227      | 112073 | 5890       | 1.3578          | 0.2726 | 30881         | 0.2834 | 0.4305 | 0.5695 |
+| 1.4504        | 8.0   | 23816  | 0.1256 | 4512      | 113841 | 5758       | 1.3262          | 0.2605 | 29828         | 0.2706 | 0.4147 | 0.5853 |
+| 1.4098        | 9.0   | 26793  | 0.1195 | 4580      | 115426 | 5441       | 1.2918          | 0.2486 | 28175         | 0.2578 | 0.3967 | 0.6033 |
+| 1.3717        | 10.0  | 29770  | 0.1146 | 4666      | 116052 | 4869       | 1.2777          | 0.2417 | 27463         | 0.2497 | 0.3875 | 0.6125 |
+| 1.3573        | 11.0  | 32747  | 0.1123 | 4193      | 117058 | 5268       | 1.2628          | 0.2372 | 26930         | 0.2456 | 0.3804 | 0.6196 |
+| 1.3433        | 12.0  | 35724  | 0.1085 | 4814      | 117567 | 4293       | 1.2455          | 0.2289 | 25800         | 0.2356 | 0.3683 | 0.6317 |
+| 1.3281        | 13.0  | 38701  | 0.1068 | 3789      | 118972 | 5402       | 1.2333          | 0.2254 | 25420         | 0.2336 | 0.3623 | 0.6377 |
+| 1.3068        | 14.0  | 41678  | 0.1019 | 4076      | 119434 | 4622       | 1.2159          | 0.2184 | 24671         | 0.2252 | 0.3527 | 0.6473 |
+| 1.2847        | 15.0  | 44655  | 0.1017 | 4042      | 119608 | 4683       | 1.2081          | 0.2176 | 24531         | 0.2244 | 0.3513 | 0.6487 |
+| 1.2753        | 16.0  | 47632  | 0.1007 | 4211      | 119928 | 4304       | 1.2023          | 0.2135 | 24042         | 0.2197 | 0.3454 | 0.6546 |
+| 1.2793        | 17.0  | 50609  | 0.0950 | 3660      | 121093 | 4365       | 1.1862          | 0.2062 | 23428         | 0.2123 | 0.3354 | 0.6646 |
+| 1.2676        | 18.0  | 53586  | 0.0927 | 3813      | 121198 | 4207       | 1.1843          | 0.2047 | 23170         | 0.2105 | 0.3328 | 0.6672 |
+| 1.2256        | 19.0  | 56563  | 0.0936 | 3948      | 121257 | 4033       | 1.1795          | 0.2034 | 22976         | 0.2089 | 0.3308 | 0.6692 |
+| 1.2238        | 20.0  | 59540  | 0.0932 | 3634      | 121864 | 4372       | 1.1736          | 0.2012 | 22683         | 0.2071 | 0.3270 | 0.6730 |
+| 1.2206        | 21.0  | 62517  | 0.0892 | 3862      | 122333 | 3732       | 1.1623          | 0.1947 | 21986         | 0.1996 | 0.3178 | 0.6822 |
+| 1.2018        | 22.0  | 65494  | 0.0893 | 4037      | 122051 | 3703       | 1.1614          | 0.1964 | 22093         | 0.2013 | 0.3200 | 0.6800 |
+| 1.1791        | 23.0  | 68471  | 0.0868 | 3759      | 122943 | 3708       | 1.1510          | 0.1906 | 21479         | 0.1953 | 0.3114 | 0.6886 |
+| 1.1958        | 24.0  | 71448  | 0.0855 | 3610      | 123356 | 3784       | 1.1438          | 0.1883 | 21215         | 0.1931 | 0.3078 | 0.6922 |
+| 1.1672        | 25.0  | 74425  | 0.0863 | 3626      | 123289 | 3861       | 1.1420          | 0.1891 | 21266         | 0.1940 | 0.3088 | 0.6912 |
+| 1.1595        | 26.0  | 77402  | 0.0843 | 3654      | 123784 | 3735       | 1.1358          | 0.1852 | 20743         | 0.1898 | 0.3026 | 0.6974 |
+| 1.1803        | 27.0  | 80379  | 0.0838 | 3620      | 123595 | 3580       | 1.1343          | 0.1856 | 20966         | 0.1901 | 0.3041 | 0.6959 |
+| 1.1488        | 28.0  | 83356  | 0.0810 | 3229      | 124441 | 3746       | 1.1262          | 0.1809 | 20511         | 0.1855 | 0.2972 | 0.7028 |
+| 1.1303        | 29.0  | 86333  | 0.0801 | 3279      | 124600 | 3636       | 1.1233          | 0.1793 | 20302         | 0.1837 | 0.2946 | 0.7054 |
+| 1.1266        | 30.0  | 89310  | 0.0791 | 3487      | 124687 | 3447       | 1.1203          | 0.1777 | 20007         | 0.1818 | 0.2918 | 0.7082 |
+| 1.14          | 31.0  | 92287  | 0.0790 | 3318      | 124938 | 3616       | 1.1179          | 0.1769 | 19925         | 0.1813 | 0.2905 | 0.7095 |
+| 1.1151        | 32.0  | 95264  | 0.0776 | 3197      | 125137 | 3534       | 1.1115          | 0.1752 | 19847         | 0.1794 | 0.2885 | 0.7115 |
+| 1.1043        | 33.0  | 98241  | 0.0773 | 3304      | 125253 | 3522       | 1.1080          | 0.1744 | 19624         | 0.1785 | 0.2866 | 0.7134 |
+| 1.1157        | 34.0  | 101218 | 0.0762 | 3174      | 125705 | 3458       | 1.1039          | 0.1710 | 19302         | 0.1750 | 0.2817 | 0.7183 |
+| 1.0911        | 35.0  | 104195 | 0.0747 | 3152      | 125869 | 3466       | 1.1004          | 0.1700 | 19160         | 0.1740 | 0.2800 | 0.7200 |
+| 1.0722        | 36.0  | 107172 | 0.0743 | 3410      | 125819 | 3111       | 1.0978          | 0.1684 | 18952         | 0.1719 | 0.2776 | 0.7224 |
+| 1.092         | 37.0  | 110149 | 0.0742 | 3161      | 126142 | 3362       | 1.0953          | 0.1676 | 18878         | 0.1714 | 0.2763 | 0.7237 |
+| 1.0763        | 38.0  | 113126 | 0.0722 | 3187      | 126377 | 3181       | 1.0914          | 0.1651 | 18617         | 0.1686 | 0.2726 | 0.7274 |
+| 1.0667        | 39.0  | 116103 | 0.0729 | 3213      | 126366 | 3224       | 1.0918          | 0.1654 | 18602         | 0.1690 | 0.2728 | 0.7272 |
+| 1.0651        | 40.0  | 119080 | 0.0718 | 3059      | 126749 | 3191       | 1.0845          | 0.1627 | 18373         | 0.1662 | 0.2690 | 0.7310 |
+| 1.0761        | 41.0  | 122057 | 0.0703 | 2999      | 126911 | 3156       | 1.0836          | 0.1614 | 18271         | 0.1648 | 0.2673 | 0.7327 |
+| 1.0509        | 42.0  | 125034 | 0.0709 | 3290      | 126714 | 2942       | 1.0828          | 0.1615 | 18177         | 0.1647 | 0.2670 | 0.7330 |
+| 1.0409        | 43.0  | 128011 | 0.0707 | 3132      | 126946 | 3070       | 1.0798          | 0.1607 | 18103         | 0.1640 | 0.2658 | 0.7342 |
+| 1.0525        | 44.0  | 130988 | 0.0688 | 2860      | 127451 | 3100       | 1.0760          | 0.1575 | 17870         | 0.1608 | 0.2614 | 0.7386 |
+| 1.0359        | 45.0  | 133965 | 0.0680 | 2839      | 127571 | 3115       | 1.0745          | 0.1568 | 17771         | 0.1601 | 0.2602 | 0.7398 |
+| 1.0144        | 46.0  | 136942 | 0.0681 | 2790      | 127503 | 3139       | 1.0738          | 0.1574 | 17888         | 0.1607 | 0.2614 | 0.7386 |
+| 1.054         | 47.0  | 139919 | 0.0672 | 2861      | 127745 | 3062       | 1.0691          | 0.1554 | 17575         | 0.1586 | 0.2578 | 0.7422 |
+| 1.0427        | 48.0  | 142896 | 0.0667 | 2857      | 127851 | 2981       | 1.0681          | 0.1542 | 17473         | 0.1573 | 0.2562 | 0.7438 |
+| 1.0067        | 49.0  | 145873 | 0.0668 | 2874      | 127906 | 2957       | 1.0682          | 0.1537 | 17401         | 0.1568 | 0.2553 | 0.7447 |
+| 1.0054        | 50.0  | 148850 | 0.0663 | 2812      | 128002 | 2975       | 1.0669          | 0.1532 | 17367         | 0.1563 | 0.2546 | 0.7454 |
+### Framework versions
+- Transformers 4.40.0.dev0
+- PyTorch 2.2.0+rocm5.6
+- Datasets 2.18.0
+- Tokenizers 0.15.2

config.json ADDED Viewed

	@@ -0,0 +1,275 @@

+{
+  "architectures": [
+    "JointCTCAttentionEncoderDecoder"
+  ],
+  "bos_token_id": 0,
+  "ctc_weight": 0.3,
+  "decoder": {
+    "_name_or_path": "Lakoc/gpt2_256h_6l_add_head3_04",
+    "activation_function": "gelu_new",
+    "add_cross_attention": true,
+    "architectures": null,
+    "attn_pdrop": 0.1,
+    "average_logits": false,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": 0,
+    "chunk_size_feed_forward": 0,
+    "cross_attention_hidden_size": null,
+    "decoder_start_token_id": null,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "early_stopping": false,
+    "embd_pdrop": 0.1,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": 1,
+    "exponential_decay_length_penalty": null,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "head_locations": [
+      3
+    ],
+    "head_weights": [
+      0.6,
+      0.4
+    ],
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "initializer_range": 0.02,
+    "is_decoder": true,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layer_norm_epsilon": 1e-05,
+    "length_penalty": 1.0,
+    "max_length": 20,
+    "min_length": 0,
+    "model_type": "gpt2-multi-head",
+    "n_embd": 256,
+    "n_head": 4,
+    "n_inner": 2048,
+    "n_layer": 6,
+    "n_positions": 1024,
+    "no_repeat_ngram_size": 0,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": null,
+    "pos_emb_fixed": true,
+    "prefix": null,
+    "problem_type": null,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "reorder_and_upcast_attn": false,
+    "repetition_penalty": 1.0,
+    "resid_pdrop": 0.1,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "scale_attn_by_inverse_layer_idx": false,
+    "scale_attn_weights": true,
+    "sep_token_id": null,
+    "summary_activation": null,
+    "summary_first_dropout": 0.1,
+    "summary_proj_to_labels": true,
+    "summary_type": "cls_index",
+    "summary_use_proj": true,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_additional_weights": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": false,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "use_cache": true,
+    "vocab_size": 1000
+  },
+  "decoder_start_token_id": 0,
+  "encoder": {
+    "_name_or_path": "Lakoc/fisher_ebranchformer_enc_12_layers_fixed",
+    "activation_dropout": 0.1,
+    "adapter_attn_dim": null,
+    "adapter_kernel_size": 3,
+    "adapter_stride": 2,
+    "add_adapter": false,
+    "add_cross_attention": false,
+    "apply_spec_augment": false,
+    "architectures": null,
+    "attention_dropout": 0.1,
+    "bad_words_ids": null,
+    "begin_suppress_tokens": null,
+    "bos_token_id": 1,
+    "chunk_size_feed_forward": 0,
+    "classifier_proj_size": 256,
+    "codevector_dim": 256,
+    "conformer_conv_dropout": 0.1,
+    "contrastive_logits_temperature": 0.1,
+    "conv_bias": false,
+    "conv_depthwise_kernel_size": 31,
+    "conv_dim": [
+      256,
+      256
+    ],
+    "conv_kernel": [
+      3,
+      3
+    ],
+    "conv_padding": [
+      1,
+      1
+    ],
+    "conv_stride": [
+      2,
+      2
+    ],
+    "cross_attention_hidden_size": null,
+    "csgu_activation": "identity",
+    "csgu_conv_dropout": 0.1,
+    "csgu_kernel_size": 31,
+    "csgu_use_linear_after_conv": false,
+    "ctc_loss_reduction": "mean",
+    "ctc_zero_infinity": true,
+    "decoder_start_token_id": null,
+    "diversity_loss_weight": 0.1,
+    "diversity_penalty": 0.0,
+    "do_sample": false,
+    "do_stable_layer_norm": false,
+    "early_stopping": false,
+    "encoder_no_repeat_ngram_size": 0,
+    "eos_token_id": 2,
+    "exponential_decay_length_penalty": null,
+    "fe_position_embeddings": false,
+    "feat_extract_activation": "gelu",
+    "feat_extract_norm": "group",
+    "feat_proj_dropout": 0.0,
+    "feat_quantizer_dropout": 0.0,
+    "final_dropout": 0.1,
+    "finetuning_task": null,
+    "forced_bos_token_id": null,
+    "forced_eos_token_id": null,
+    "hidden_act": "gelu",
+    "hidden_dropout": 0.1,
+    "hidden_size": 256,
+    "id2label": {
+      "0": "LABEL_0",
+      "1": "LABEL_1"
+    },
+    "initializer_range": 0.02,
+    "intermediate_size": 1024,
+    "is_causal": false,
+    "is_decoder": false,
+    "is_encoder_decoder": false,
+    "label2id": {
+      "LABEL_0": 0,
+      "LABEL_1": 1
+    },
+    "layer_norm_eps": 1e-05,
+    "layerdrop": 0.0,
+    "length_penalty": 1.0,
+    "mask_feature_length": 10,
+    "mask_feature_min_masks": 0,
+    "mask_feature_prob": 0.0,
+    "mask_time_length": 10,
+    "mask_time_min_masks": 2,
+    "mask_time_prob": 0.05,
+    "max_length": 20,
+    "max_source_positions": 1024,
+    "merge_conv_kernel": 31,
+    "min_length": 0,
+    "model_type": "wav2vec2-ebranchformer",
+    "no_repeat_ngram_size": 0,
+    "num_adapter_layers": 3,
+    "num_attention_heads": 4,
+    "num_beam_groups": 1,
+    "num_beams": 1,
+    "num_codevector_groups": 2,
+    "num_codevectors_per_group": 320,
+    "num_conv_pos_embedding_groups": 16,
+    "num_conv_pos_embeddings": 128,
+    "num_fbanks": 80,
+    "num_feat_extract_layers": 2,
+    "num_hidden_layers": 12,
+    "num_mel_bins": 80,
+    "num_negatives": 100,
+    "num_return_sequences": 1,
+    "output_attentions": false,
+    "output_hidden_size": 256,
+    "output_hidden_states": false,
+    "output_scores": false,
+    "pad_token_id": 3,
+    "position_embeddings_type": "relative",
+    "prefix": null,
+    "problem_type": null,
+    "proj_codevector_dim": 256,
+    "pruned_heads": {},
+    "remove_invalid_values": false,
+    "repetition_penalty": 1.0,
+    "return_dict": true,
+    "return_dict_in_generate": false,
+    "rotary_embedding_base": 10000,
+    "sep_token_id": null,
+    "suppress_tokens": null,
+    "task_specific_params": null,
+    "tdnn_dilation": [
+      1,
+      2,
+      3,
+      1,
+      1
+    ],
+    "tdnn_dim": [
+      512,
+      512,
+      512,
+      512,
+      1500
+    ],
+    "tdnn_kernel": [
+      5,
+      3,
+      3,
+      1,
+      1
+    ],
+    "temperature": 1.0,
+    "tf_legacy_loss": false,
+    "tie_encoder_decoder": false,
+    "tie_word_embeddings": true,
+    "tokenizer_class": null,
+    "top_k": 50,
+    "top_p": 1.0,
+    "torch_dtype": null,
+    "torchscript": false,
+    "typical_p": 1.0,
+    "use_bfloat16": false,
+    "use_fbanks": true,
+    "use_macaron_ff": true,
+    "use_weighted_layer_sum": false,
+    "vocab_size": 1000,
+    "xvector_output_dim": 512
+  },
+  "eos_token_id": 1,
+  "is_encoder_decoder": true,
+  "lsm_factor": 0.1,
+  "mask_token_id": 4,
+  "model_type": "joint_aed_ctc_speech-encoder-decoder",
+  "pad_token_id": 3,
+  "shared_lm_head": false,
+  "tie_word_embeddings": false,
+  "torch_dtype": "float32",
+  "transformers_version": "4.40.0.dev0"
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "apply_eos_space_trick": false,
+  "bos_token_id": 0,
+  "ctc_margin": 0,
+  "ctc_weight": 0.0,
+  "decoder_start_token_id": 0,
+  "eos_space_trick_weight": 0.0,
+  "eos_token_id": 1,
+  "lm_model": null,
+  "lm_weight": 0.0,
+  "max_length": 512,
+  "pad_token_id": 3,
+  "space_token_id": -1,
+  "transformers_version": "4.40.0.dev0"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d76549a0d7e10e586fdab217fb2431b1e0bcfb5d17f9839a30dd537d3e187303
+size 144243216

predictions_common_voice_13_en_common_voice_13_en_test_wer19.47.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

predictions_common_voice_13_en_common_voice_13_en_test_wer19.47_hyp.trn ADDED Viewed

The diff for this file is too large to render. See raw diff

predictions_common_voice_13_en_common_voice_13_en_test_wer19.47_ref.trn ADDED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ff64ef1971f96d63c84ef22dd935a383b14e09ebbe15cece61b3429bfa7b8760
+size 5816