emilios committed on
Commit
a11b257
·
1 Parent(s): fed5629
run.sh CHANGED
@@ -12,6 +12,7 @@ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
  --logging_steps="25" \
 
15
  --max_steps="5000" \
16
  --output_dir="./" \
17
  --per_device_train_batch_size="32" \
@@ -38,7 +39,7 @@ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
38
  --do_eval \
39
  --predict_with_generate \
40
  --do_normalize_eval \
41
- --streaming="False" \
42
  --use_auth_token \
43
  --push_to_hub
44
 
 
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
  --logging_steps="25" \
15
+ --learning_rate="1e-5" \
16
  --max_steps="5000" \
17
  --output_dir="./" \
18
  --per_device_train_batch_size="32" \
 
39
  --do_eval \
40
  --predict_with_generate \
41
  --do_normalize_eval \
42
+ --streaming="True" \
43
  --use_auth_token \
44
  --push_to_hub
45
 
run.sh.mlcommons CHANGED
@@ -12,6 +12,7 @@ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
  --logging_steps="25" \
 
15
  --max_steps="5000" \
16
  --output_dir="./" \
17
  --per_device_train_batch_size="32" \
 
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
  --logging_steps="25" \
15
+ --learning_rate="1e-5" \
16
  --max_steps="5000" \
17
  --output_dir="./" \
18
  --per_device_train_batch_size="32" \
run.sh.mlcommons-streaming ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
2
+ --deepspeed="ds_config.json" \
3
+ --model_name_or_path="emilios/whisper-medium-el" \
4
+ --dataset_name="mozilla-foundation/common_voice_11_0,google/fleurs,MLCommons/ml_spoken_words" \
5
+ --dataset_config_name="el,el_gr,el_wav" \
6
+ --language="greek" \
7
+ --train_split_name="train+validation,train+validation,train+validation" \
8
+ --eval_split_name="test,-,-" \
9
+ --model_index_name="Whisper medium Greek El Greco" \
10
+ --text_column_name="sentence,transcription,keyword" \
11
+ --torch_compile="True" \
12
+ --torch_compile_mode="reduce-overhead" \
13
+ --torch_compile_mode="max-autotune" \
14
+ --logging_steps="25" \
15
+ --learning_rate="1e-5" \
16
+ --max_steps="5000" \
17
+ --output_dir="./" \
18
+ --per_device_train_batch_size="32" \
19
+ --gradient_accumulation_steps="1" \
20
+ --per_device_eval_batch_size="16" \
21
+ --seed="42" \
22
+ --warmup_steps="500" \
23
+ --evaluation_strategy="steps" \
24
+ --eval_steps="1000" \
25
+ --save_strategy="steps" \
26
+ --save_steps="1000" \
27
+ --generation_max_length="225" \
28
+ --length_column_name="input_length" \
29
+ --max_duration_in_seconds="30" \
30
+ --freeze_feature_encoder="False" \
31
+ --report_to="tensorboard" \
32
+ --metric_for_best_model="wer" \
33
+ --greater_is_better="False" \
34
+ --load_best_model_at_end \
35
+ --gradient_checkpointing \
36
+ --fp16 \
37
+ --overwrite_output_dir \
38
+ --do_train \
39
+ --do_eval \
40
+ --predict_with_generate \
41
+ --do_normalize_eval \
42
+ --streaming="True" \
43
+ --use_auth_token \
44
+ --push_to_hub
45
+
runs/Dec21_11-16-44_129-146-176-120/events.out.tfevents.1671627320.129-146-176-120.3027155.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d20614f4043f3402001ae757a598a2ff189f2582afcd74ebb519420939924fb
3
- size 10883
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76c4eaee524692bbaaf5721be54975bfe624865adb19636f7a9b60cfec04955c
3
+ size 11668