Saving train state of step 50
Browse files
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "./distil-large-v3-init",
|
3 |
"activation_dropout": 0.0,
|
4 |
"activation_function": "gelu",
|
5 |
"apply_spec_augment": false,
|
distil-whisper/events.out.tfevents.1713339458.mycena-3090.108763.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90f93557093b773784b3994c6fdde2d1b34296f695318bb742b29bfb082c0a48
|
3 |
+
size 88
|
distil-whisper/events.out.tfevents.1713339486.mycena-3090.109177.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0438dc8d20b30444cd5f1848ec0cf9c3536e9e50be3f530c956772bab72e203
|
3 |
+
size 696
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a81674d4973bf8cbf2e1b696063c781f3cf2b595e3a93bf160dbb2ee4e3289f
|
3 |
+
size 3025686376
|
run_distillation.py
CHANGED
@@ -1297,7 +1297,10 @@ def main():
|
|
1297 |
# we do not want to group tokens when computing the metrics
|
1298 |
label_str = tokenizer.batch_decode(labels, skip_special_tokens=True)
|
1299 |
# !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1
|
1300 |
-
|
|
|
|
|
|
|
1301 |
wer_ortho = 100 * chinese_wer(pred_str, label_str)
|
1302 |
|
1303 |
# normalize everything and re-compute the WER
|
|
|
1297 |
# we do not want to group tokens when computing the metrics
|
1298 |
label_str = tokenizer.batch_decode(labels, skip_special_tokens=True)
|
1299 |
# !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!1
|
1300 |
+
print("pred_str: ", pred_str)
|
1301 |
+
print("label_str: ", label_str)
|
1302 |
+
print("!!!!!!!!!!!!!!!!!!!!!!!!!")
|
1303 |
+
wer_ortho = 100 * metric.compute(predictions=pred_str, references=label_str)
|
1304 |
wer_ortho = 100 * chinese_wer(pred_str, label_str)
|
1305 |
|
1306 |
# normalize everything and re-compute the WER
|