ibrahimj committed on
Commit
5f67028
1 Parent(s): 40422f7

Training in progress, step 36000

Browse files
all_results.json CHANGED
@@ -5,8 +5,8 @@
5
  "eval_samples_per_second": 0.81,
6
  "eval_steps_per_second": 0.203,
7
  "eval_wer": 29.205723913714138,
8
- "train_loss": 0.7804906897136143,
9
- "train_runtime": 406099.0091,
10
- "train_samples_per_second": 0.689,
11
- "train_steps_per_second": 0.086
12
  }
 
5
  "eval_samples_per_second": 0.81,
6
  "eval_steps_per_second": 0.203,
7
  "eval_wer": 29.205723913714138,
8
+ "train_loss": 1.5390448555129346e-05,
9
+ "train_runtime": 6.8399,
10
+ "train_samples_per_second": 40936.549,
11
+ "train_steps_per_second": 5117.069
12
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ad2bde5feeaec1a9101e1776c6370a1ba226a08d8ed0cbf0fdd980af2ad1150
3
  size 4936567968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2793cdc0144994fe021fe306cd3dab078f8e2a27184dc7a8734c2650705c9db5
3
  size 4936567968
runs/Feb04_08-43-21_ip-10-0-3-5.eu-west-1.compute.internal/events.out.tfevents.1707036244.ip-10-0-3-5.eu-west-1.compute.internal.10679.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11a6a682062abf19d149cbf3e928b6f72a7b99231e75383176c59544e5e7a8a9
3
+ size 11942
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 0.18,
3
- "train_loss": 0.7804906897136143,
4
- "train_runtime": 406099.0091,
5
- "train_samples_per_second": 0.689,
6
- "train_steps_per_second": 0.086
7
  }
 
1
  {
2
  "epoch": 0.18,
3
+ "train_loss": 1.5390448555129346e-05,
4
+ "train_runtime": 6.8399,
5
+ "train_samples_per_second": 40936.549,
6
+ "train_steps_per_second": 5117.069
7
  }
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 29.205723913714138,
3
  "best_model_checkpoint": "./hamsa-pretrained/checkpoint-35000",
4
- "epoch": 0.17544035529178237,
5
  "eval_steps": 1000,
6
- "global_step": 35000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -8725,12 +8725,12 @@
8725
  },
8726
  {
8727
  "epoch": 0.18,
8728
- "step": 35000,
8729
- "total_flos": 4.753690066944e+20,
8730
- "train_loss": 0.7804906897136143,
8731
- "train_runtime": 406099.0091,
8732
- "train_samples_per_second": 0.689,
8733
- "train_steps_per_second": 0.086
8734
  }
8735
  ],
8736
  "logging_steps": 25,
@@ -8738,7 +8738,7 @@
8738
  "num_input_tokens_seen": 0,
8739
  "num_train_epochs": 1,
8740
  "save_steps": 1000,
8741
- "total_flos": 4.753690066944e+20,
8742
  "train_batch_size": 8,
8743
  "trial_name": null,
8744
  "trial_params": null
 
1
  {
2
  "best_metric": 29.205723913714138,
3
  "best_model_checkpoint": "./hamsa-pretrained/checkpoint-35000",
4
+ "epoch": 0.17544536787336215,
5
  "eval_steps": 1000,
6
+ "global_step": 35001,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
8725
  },
8726
  {
8727
  "epoch": 0.18,
8728
+ "step": 35001,
8729
+ "total_flos": 4.7538258866601984e+20,
8730
+ "train_loss": 1.5390448555129346e-05,
8731
+ "train_runtime": 6.8399,
8732
+ "train_samples_per_second": 40936.549,
8733
+ "train_steps_per_second": 5117.069
8734
  }
8735
  ],
8736
  "logging_steps": 25,
 
8738
  "num_input_tokens_seen": 0,
8739
  "num_train_epochs": 1,
8740
  "save_steps": 1000,
8741
+ "total_flos": 4.7538258866601984e+20,
8742
  "train_batch_size": 8,
8743
  "trial_name": null,
8744
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bac3075244d6d9afe4f493d1fbf75070decb9ab6fd1bd6f21224543f2e1206e0
3
  size 4856
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74b9e93f07ccec52bc6245b5cb3e4e9324c69da5b5fc95cb33c1098eb297b715
3
  size 4856