File size: 1,335 Bytes
dfd6be9
 
 
 
 
 
 
 
25ea1ba
dfd6be9
25ea1ba
 
 
dfd6be9
25ea1ba
dfd6be9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
# Launcher for run_speech_recognition_seq2seq_streaming.py (looked up relative
# to the current working directory) with a fixed set of options.
#
# The option list is assembled group by group and handed to the script in one
# call; the order of the options is the order in which they are appended below.
launch_finetune() {
  # Start from an empty argument list. Inside a function this only affects the
  # function's own positional parameters, not those of the calling script.
  set --

  # Base checkpoint, dataset, language and split selection.
  set -- "$@" \
    --model_name_or_path="openai/whisper-small" \
    --dataset_name="google/fleurs" \
    --dataset_config_name="ps_af" \
    --language="pashto" \
    --train_split_name="train+validation" \
    --eval_split_name="test" \
    --model_index_name="Whisper Small Pashto"

  # Run length, output location, batch sizes and optimizer schedule.
  set -- "$@" \
    --max_steps="800" \
    --output_dir="./" \
    --per_device_train_batch_size="64" \
    --per_device_eval_batch_size="32" \
    --gradient_accumulation_steps="1" \
    --logging_steps="10" \
    --learning_rate="3e-7" \
    --warmup_steps="500"

  # Evaluation and checkpoint cadence (both step-based, every 100 steps).
  set -- "$@" \
    --evaluation_strategy="steps" \
    --eval_steps="100" \
    --save_strategy="steps" \
    --save_steps="100"

  # Generation length, column names and input-duration settings.
  set -- "$@" \
    --generation_max_length="225" \
    --length_column_name="input_length" \
    --max_duration_in_seconds="30" \
    --text_column_name="transcription" \
    --freeze_feature_encoder="False"

  # Logging backend and best-model criterion ("wer", with
  # greater_is_better set to "False").
  set -- "$@" \
    --report_to="tensorboard" \
    --metric_for_best_model="wer" \
    --greater_is_better="False"

  # Remaining switches. Note that overwrite_output_dir and streaming are
  # passed explicitly as "False" rather than being omitted.
  set -- "$@" \
    --load_best_model_at_end \
    --gradient_checkpointing \
    --fp16 \
    --overwrite_output_dir="False" \
    --do_train \
    --do_eval \
    --predict_with_generate \
    --do_normalize_eval \
    --streaming="False" \
    --push_to_hub \
    --use_auth_token

  # The function's status (and therefore the script's) is python's status.
  python run_speech_recognition_seq2seq_streaming.py "$@"
}

launch_finetune