Sagicc committed on
Commit
66cc2ab
1 Parent(s): ab9f0a5

End of training

Browse files
Files changed (2) hide show
  1. README.md +32 -5
  2. generation_config.json +7 -1
README.md CHANGED
@@ -1,23 +1,42 @@
1
  ---
2
  language:
3
- - dv
4
  license: apache-2.0
5
  base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_13_0
 
 
10
  model-index:
11
- - name: Whisper Small Dv - Sanchit Gandhi
12
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  ---
14
 
15
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
16
  should probably proofread and complete it, then remove this comment. -->
17
 
18
- # Whisper Small Dv - Sanchit Gandhi
19
 
20
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 13 dataset.
 
 
 
 
21
 
22
  ## Model description
23
 
@@ -43,7 +62,15 @@ The following hyperparameters were used during training:
43
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
44
  - lr_scheduler_type: constant_with_warmup
45
  - lr_scheduler_warmup_steps: 50
46
- - training_steps: 500
 
 
 
 
 
 
 
 
47
 
48
  ### Framework versions
49
 
 
1
  ---
2
  language:
3
+ - sr
4
  license: apache-2.0
5
  base_model: openai/whisper-small
6
  tags:
7
  - generated_from_trainer
8
  datasets:
9
  - mozilla-foundation/common_voice_13_0
10
+ metrics:
11
+ - wer
12
  model-index:
13
+ - name: Whisper Small Sr - Sagicc
14
+ results:
15
+ - task:
16
+ name: Automatic Speech Recognition
17
+ type: automatic-speech-recognition
18
+ dataset:
19
+ name: Common Voice 13
20
+ type: mozilla-foundation/common_voice_13_0
21
+ config: sr
22
+ split: test
23
+ args: sr
24
+ metrics:
25
+ - name: Wer
26
+ type: wer
27
+ value: 18.092962641181582
28
  ---
29
 
30
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
31
  should probably proofread and complete it, then remove this comment. -->
32
 
33
+ # Whisper Small Sr - Sagicc
34
 
35
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 13 dataset.
36
+ It achieves the following results on the evaluation set:
37
+ - Loss: 0.3675
38
+ - Wer Ortho: 28.9565
39
+ - Wer: 18.0930
40
 
41
  ## Model description
42
 
 
62
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
63
  - lr_scheduler_type: constant_with_warmup
64
  - lr_scheduler_warmup_steps: 50
65
+ - training_steps: 1000
66
+
67
+ ### Training results
68
+
69
+ | Training Loss | Epoch | Step | Validation Loss | Wer Ortho | Wer |
70
+ |:-------------:|:-----:|:----:|:---------------:|:---------:|:-------:|
71
+ | 0.0728 | 2.87 | 500 | 0.2978 | 29.5435 | 18.8749 |
72
+ | 0.0318 | 5.75 | 1000 | 0.3675 | 28.9565 | 18.0930 |
73
+
74
 
75
  ### Framework versions
76
 
generation_config.json CHANGED
@@ -51,11 +51,15 @@
51
  "forced_decoder_ids": [
52
  [
53
  1,
54
- null
55
  ],
56
  [
57
  2,
58
  50359
 
 
 
 
59
  ]
60
  ],
61
  "is_multilingual": true,
@@ -160,6 +164,7 @@
160
  "<|yo|>": 50325,
161
  "<|zh|>": 50260
162
  },
 
163
  "max_initial_timestamp_index": 1,
164
  "max_length": 448,
165
  "no_timestamps_token_id": 50363,
@@ -255,6 +260,7 @@
255
  50361,
256
  50362
257
  ],
 
258
  "task_to_id": {
259
  "transcribe": 50359,
260
  "translate": 50358
 
51
  "forced_decoder_ids": [
52
  [
53
  1,
54
+ 50303
55
  ],
56
  [
57
  2,
58
  50359
59
+ ],
60
+ [
61
+ 3,
62
+ 50363
63
  ]
64
  ],
65
  "is_multilingual": true,
 
164
  "<|yo|>": 50325,
165
  "<|zh|>": 50260
166
  },
167
+ "language": "serbian",
168
  "max_initial_timestamp_index": 1,
169
  "max_length": 448,
170
  "no_timestamps_token_id": 50363,
 
260
  50361,
261
  50362
262
  ],
263
+ "task": "transcribe",
264
  "task_to_id": {
265
  "transcribe": 50359,
266
  "translate": 50358