Training in progress, step 1000

Files changed (5) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "openai/whisper-large-v3",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
@@ -9,7 +9,7 @@
   "attention_dropout": 0.0,
   "begin_suppress_tokens": [
     220,
-    50257
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
@@ -17,7 +17,7 @@
   "decoder_attention_heads": 20,
   "decoder_ffn_dim": 5120,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 32,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
   "encoder_attention_heads": 20,
@@ -34,18 +34,16 @@
   "mask_time_length": 10,
   "mask_time_min_masks": 2,
   "mask_time_prob": 0.05,
-  "max_length": 448,
   "max_source_positions": 1500,
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
   "num_hidden_layers": 32,
   "num_mel_bins": 128,
-  "pad_token_id": 50256,
   "scale_embedding": false,
-  "suppress_tokens": [],
   "torch_dtype": "float32",
-  "transformers_version": "4.41.0.dev0",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51866

 {
+  "_name_or_path": "openai/whisper-large-v3-turbo",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
   "attention_dropout": 0.0,
   "begin_suppress_tokens": [
     220,
+    50256
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
   "decoder_attention_heads": 20,
   "decoder_ffn_dim": 5120,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 4,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
   "encoder_attention_heads": 20,
   "mask_time_length": 10,
   "mask_time_min_masks": 2,
   "mask_time_prob": 0.05,
   "max_source_positions": 1500,
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
   "num_hidden_layers": 32,
   "num_mel_bins": 128,
+  "pad_token_id": 50257,
   "scale_embedding": false,
   "torch_dtype": "float32",
+  "transformers_version": "4.47.0.dev0",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51866

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2985f36c45745745c7f7c7d5079ae773b534671755a0697ff212fcf45610f3eb
+size 3235581408

runs/Dec05_14-17-07_a35b2528692b/events.out.tfevents.1733408247.a35b2528692b.486.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:cc857b2c53d8a415314cc3465e217cebcc386e3849941d64082a0a93e4f4b99f
+size 14627

tokenizer_config.json CHANGED Viewed

@@ -12987,6 +12987,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "errors": "replace",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|endoftext|>",
   "processor_class": "WhisperProcessor",

   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
   "errors": "replace",
+  "extra_special_tokens": {},
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<|endoftext|>",
   "processor_class": "WhisperProcessor",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b782e35f7b12d3a5b7b3a6c3707dc8c3043cd7920f9f081c416cf177a85a4a2
-size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:01e26c2f51a6e826cb4ad97120ecc89360ba3e22e0b7cfde7899f17621125662
+size 5496