Chahat7874 committed on
Commit
efc63d1
1 Parent(s): cadf363

End of training

Browse files
README.md CHANGED
@@ -1,13 +1,33 @@
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: facebook/wav2vec2-large-xlsr-53
4
  tags:
 
 
 
5
  - generated_from_trainer
6
  datasets:
7
  - common_voice_15_0
 
 
8
  model-index:
9
  - name: wav2vec2-common_voice-en-demo
10
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  ---
12
 
13
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -15,7 +35,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # wav2vec2-common_voice-en-demo
17
 
18
- This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on the common_voice_15_0 dataset.
 
 
 
19
 
20
  ## Model description
21
 
 
1
  ---
2
+ language:
3
+ - hi
4
  license: apache-2.0
5
  base_model: facebook/wav2vec2-large-xlsr-53
6
  tags:
7
+ - automatic-speech-recognition
8
+ - mozilla-foundation/common_voice_15_0
9
+ - mms
10
  - generated_from_trainer
11
  datasets:
12
  - common_voice_15_0
13
+ metrics:
14
+ - wer
15
  model-index:
16
  - name: wav2vec2-common_voice-en-demo
17
+ results:
18
+ - task:
19
+ name: Automatic Speech Recognition
20
+ type: automatic-speech-recognition
21
+ dataset:
22
+ name: MOZILLA-FOUNDATION/COMMON_VOICE_15_0 - HI
23
+ type: common_voice_15_0
24
+ config: hi
25
+ split: validation
26
+ args: 'Config: hi, Training split: train, Eval split: validation'
27
+ metrics:
28
+ - name: Wer
29
+ type: wer
30
+ value: 1.0018709995076318
31
  ---
32
 
33
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
35
 
36
  # wav2vec2-common_voice-en-demo
37
 
38
+ This model is a fine-tuned version of [facebook/wav2vec2-large-xlsr-53](https://huggingface.co/facebook/wav2vec2-large-xlsr-53) on the MOZILLA-FOUNDATION/COMMON_VOICE_15_0 - HI dataset.
39
+ It achieves the following results on the evaluation set:
40
+ - Loss: 20.2335
41
+ - Wer: 1.0019
42
 
43
  ## Model description
44
 
adapter.eng.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a8f7630ac9b159754bf09a63f4c2101535a1287172d38e194eb4ea08c5e32bf
3
  size 3918936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f16202c0de9c8feeaa1cf336a6630fc754a6ed13dca6fb50a2468e0c7c3f94d2
3
  size 3918936
all_results.json CHANGED
@@ -1,15 +1,15 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_loss": 3.4593591690063477,
4
- "eval_runtime": 163.4642,
5
  "eval_samples": 2416,
6
- "eval_samples_per_second": 14.78,
7
- "eval_steps_per_second": 1.847,
8
- "eval_wer": 1.0,
9
- "total_flos": 3.0520251232525025e+18,
10
- "train_loss": 7.648091746363146,
11
- "train_runtime": 3314.4653,
12
  "train_samples": 4630,
13
- "train_samples_per_second": 6.985,
14
- "train_steps_per_second": 0.219
15
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 20.233524322509766,
4
+ "eval_runtime": 167.9773,
5
  "eval_samples": 2416,
6
+ "eval_samples_per_second": 14.383,
7
+ "eval_steps_per_second": 1.798,
8
+ "eval_wer": 1.0018709995076318,
9
+ "total_flos": 6.105598680744346e+17,
10
+ "train_loss": 18.518729795258622,
11
+ "train_runtime": 625.4328,
12
  "train_samples": 4630,
13
+ "train_samples_per_second": 7.403,
14
+ "train_steps_per_second": 0.232
15
  }
eval_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 5.0,
3
- "eval_loss": 3.4593591690063477,
4
- "eval_runtime": 163.4642,
5
  "eval_samples": 2416,
6
- "eval_samples_per_second": 14.78,
7
- "eval_steps_per_second": 1.847,
8
- "eval_wer": 1.0
9
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "eval_loss": 20.233524322509766,
4
+ "eval_runtime": 167.9773,
5
  "eval_samples": 2416,
6
+ "eval_samples_per_second": 14.383,
7
+ "eval_steps_per_second": 1.798,
8
+ "eval_wer": 1.0018709995076318
9
  }
runs/May24_13-44-28_05119ae56480/events.out.tfevents.1716559249.05119ae56480.2817.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec1182a66fbf3e89b77dd386abe585ba9c3521b30e40c773a7181b58f5acefd2
3
+ size 406
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "epoch": 5.0,
3
- "total_flos": 3.0520251232525025e+18,
4
- "train_loss": 7.648091746363146,
5
- "train_runtime": 3314.4653,
6
  "train_samples": 4630,
7
- "train_samples_per_second": 6.985,
8
- "train_steps_per_second": 0.219
9
  }
 
1
  {
2
+ "epoch": 1.0,
3
+ "total_flos": 6.105598680744346e+17,
4
+ "train_loss": 18.518729795258622,
5
+ "train_runtime": 625.4328,
6
  "train_samples": 4630,
7
+ "train_samples_per_second": 7.403,
8
+ "train_steps_per_second": 0.232
9
  }
trainer_state.json CHANGED
@@ -1,97 +1,36 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.0,
5
  "eval_steps": 100,
6
- "global_step": 725,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.6896551724137931,
13
- "eval_loss": 21.946964263916016,
14
- "eval_runtime": 163.3947,
15
- "eval_samples_per_second": 14.786,
16
- "eval_steps_per_second": 1.848,
17
  "eval_wer": 1.0003446578040374,
18
  "step": 100
19
  },
20
  {
21
- "epoch": 1.3793103448275863,
22
- "eval_loss": 17.29347801208496,
23
- "eval_runtime": 162.2438,
24
- "eval_samples_per_second": 14.891,
25
- "eval_steps_per_second": 1.861,
26
- "eval_wer": 1.0,
27
- "step": 200
28
- },
29
- {
30
- "epoch": 2.0689655172413794,
31
- "eval_loss": 3.521054267883301,
32
- "eval_runtime": 161.4701,
33
- "eval_samples_per_second": 14.963,
34
- "eval_steps_per_second": 1.87,
35
- "eval_wer": 1.0,
36
- "step": 300
37
- },
38
- {
39
- "epoch": 2.7586206896551726,
40
- "eval_loss": 3.507359027862549,
41
- "eval_runtime": 160.5709,
42
- "eval_samples_per_second": 15.046,
43
- "eval_steps_per_second": 1.881,
44
- "eval_wer": 1.0,
45
- "step": 400
46
- },
47
- {
48
- "epoch": 3.4482758620689653,
49
- "grad_norm": 0.5087113976478577,
50
- "learning_rate": 0.00029759999999999997,
51
- "loss": 9.5434,
52
- "step": 500
53
- },
54
- {
55
- "epoch": 3.4482758620689653,
56
- "eval_loss": 3.4881255626678467,
57
- "eval_runtime": 161.0375,
58
- "eval_samples_per_second": 15.003,
59
- "eval_steps_per_second": 1.875,
60
- "eval_wer": 1.0,
61
- "step": 500
62
- },
63
- {
64
- "epoch": 4.137931034482759,
65
- "eval_loss": 3.487558603286743,
66
- "eval_runtime": 159.8397,
67
- "eval_samples_per_second": 15.115,
68
- "eval_steps_per_second": 1.889,
69
- "eval_wer": 1.0,
70
- "step": 600
71
- },
72
- {
73
- "epoch": 4.827586206896552,
74
- "eval_loss": 3.489640951156616,
75
- "eval_runtime": 160.42,
76
- "eval_samples_per_second": 15.06,
77
- "eval_steps_per_second": 1.883,
78
- "eval_wer": 1.0,
79
- "step": 700
80
- },
81
- {
82
- "epoch": 5.0,
83
- "step": 725,
84
- "total_flos": 3.0520251232525025e+18,
85
- "train_loss": 7.648091746363146,
86
- "train_runtime": 3314.4653,
87
- "train_samples_per_second": 6.985,
88
- "train_steps_per_second": 0.219
89
  }
90
  ],
91
  "logging_steps": 500,
92
- "max_steps": 725,
93
  "num_input_tokens_seen": 0,
94
- "num_train_epochs": 5,
95
  "save_steps": 400,
96
  "stateful_callbacks": {
97
  "TrainerControl": {
@@ -105,7 +44,7 @@
105
  "attributes": {}
106
  }
107
  },
108
- "total_flos": 3.0520251232525025e+18,
109
  "train_batch_size": 16,
110
  "trial_name": null,
111
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0,
5
  "eval_steps": 100,
6
+ "global_step": 145,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.6896551724137931,
13
+ "eval_loss": 21.947891235351562,
14
+ "eval_runtime": 168.4847,
15
+ "eval_samples_per_second": 14.34,
16
+ "eval_steps_per_second": 1.792,
17
  "eval_wer": 1.0003446578040374,
18
  "step": 100
19
  },
20
  {
21
+ "epoch": 1.0,
22
+ "step": 145,
23
+ "total_flos": 6.105598680744346e+17,
24
+ "train_loss": 18.518729795258622,
25
+ "train_runtime": 625.4328,
26
+ "train_samples_per_second": 7.403,
27
+ "train_steps_per_second": 0.232
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 145,
32
  "num_input_tokens_seen": 0,
33
+ "num_train_epochs": 1,
34
  "save_steps": 400,
35
  "stateful_callbacks": {
36
  "TrainerControl": {
 
44
  "attributes": {}
45
  }
46
  },
47
+ "total_flos": 6.105598680744346e+17,
48
  "train_batch_size": 16,
49
  "trial_name": null,
50
  "trial_params": null