marinone94
/

whisper-training-blog

Automatic Speech Recognition

Generated from Trainer

Inference Endpoints

Model card Files Files and versions Community

marinone94 committed on Jan 26, 2023

Commit

4123391

·

1 Parent(s): 3644968

delete checkpoint at the end

Files changed (1) hide show

huggingface_training.py +8 -1

huggingface_training.py CHANGED Viewed

@@ -282,8 +282,11 @@ training_args = Seq2SeqTrainingArguments(
     logging_steps=logging_steps,
     save_strategy="steps",
     save_steps=eval_steps,
-    save_total_limit=2,
     learning_rate=1e-5,
 	warmup_ratio=0.5 if test_script is True else 0.2,
     per_device_train_batch_size=train_bs,
     per_device_eval_batch_size=eval_bs,
@@ -370,4 +373,8 @@ print(final_metrics)
 # Pushing to hub during training slows down training
 # so we push it only in the end.
 trainer.push_to_hub()

     logging_steps=logging_steps,
     save_strategy="steps",
     save_steps=eval_steps,
+    # save_total_limit=2,
     learning_rate=1e-5,
+    load_best_model_at_end=True,
+    metric_for_best_model="wer",
+    greater_is_better=False,
 	warmup_ratio=0.5 if test_script is True else 0.2,
     per_device_train_batch_size=train_bs,
     per_device_eval_batch_size=eval_bs,
 # Pushing to hub during training slows down training
 # so we push it only in the end.
+# Since training is completed and the best model has been saved, we first delete the checkpoints
+for filename in os.listdir("."):
+    if filename.startswith("checkpoint-"):
+        os.remove(f"./{filename}")
 trainer.push_to_hub()