JiHungLin committed on
Commit
796f97d
1 Parent(s): 976a543

Saving train state of step 50

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-large-v3",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
 
1
  {
2
+ "_name_or_path": "./distil-large-v3-init",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "apply_spec_augment": false,
distil-whisper/events.out.tfevents.1713339458.mycena-3090.108763.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90f93557093b773784b3994c6fdde2d1b34296f695318bb742b29bfb082c0a48
3
+ size 88
distil-whisper/events.out.tfevents.1713339486.mycena-3090.109177.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0438dc8d20b30444cd5f1848ec0cf9c3536e9e50be3f530c956772bab72e203
3
+ size 696
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a81674d4973bf8cbf2e1b696063c781f3cf2b595e3a93bf160dbb2ee4e3289f
3
+ size 3025686376
run_distillation.py CHANGED
@@ -1297,7 +1297,10 @@ def main():
1297
  # we do not want to group tokens when computing the metrics
1298
  label_str = tokenizer.batch_decode(labels, skip_special_tokens=True)
1299
  # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1
1300
- # wer_ortho = 100 * metric.compute(predictions=pred_str, references=label_str)
 
 
 
1301
  wer_ortho = 100 * chinese_wer(pred_str, label_str)
1302
 
1303
  # normalize everything and re-compute the WER
 
1297
  # we do not want to group tokens when computing the metrics
1298
  label_str = tokenizer.batch_decode(labels, skip_special_tokens=True)
1299
  # !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1
1300
+ print("pred_str: ", pred_str)
1301
+ print("label_str: ", label_str)
1302
+ print("!!!!!!!!!!!!!!!!!!!!!!!!!")
1303
+ wer_ortho = 100 * metric.compute(predictions=pred_str, references=label_str)
1304
  wer_ortho = 100 * chinese_wer(pred_str, label_str)
1305
 
1306
  # normalize everything and re-compute the WER