Maniac committed on
Commit
ad0da0e
1 Parent(s): a6df0e4

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 666.67,
3
+ "eval_loss": 3.8433420658111572,
4
+ "eval_runtime": 5.4398,
5
+ "eval_samples": 142,
6
+ "eval_samples_per_second": 26.104,
7
+ "eval_steps_per_second": 3.309,
8
+ "eval_wer": 0.985178727114211,
9
+ "train_loss": 0.3888468391895294,
10
+ "train_runtime": 14986.9731,
11
+ "train_samples": 378,
12
+ "train_samples_per_second": 17.082,
13
+ "train_steps_per_second": 0.133
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 666.67,
3
+ "eval_loss": 3.8433420658111572,
4
+ "eval_runtime": 5.4398,
5
+ "eval_samples": 142,
6
+ "eval_samples_per_second": 26.104,
7
+ "eval_steps_per_second": 3.309,
8
+ "eval_wer": 0.985178727114211
9
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69a45d2822bb91bb974d2b31bca68deb636d59da4ce6e50856a6d192d1bccd6f
3
  size 1262149169
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c682e1bb0700134f686d26b075c5572f761a09b187c8e8a9acacbbba67037762
3
  size 1262149169
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 666.67,
3
+ "train_loss": 0.3888468391895294,
4
+ "train_runtime": 14986.9731,
5
+ "train_samples": 378,
6
+ "train_samples_per_second": 17.082,
7
+ "train_steps_per_second": 0.133
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 666.6666666666666,
5
+ "global_step": 2000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 166.67,
12
+ "learning_rate": 0.00022529999999999997,
13
+ "loss": 1.468,
14
+ "step": 500
15
+ },
16
+ {
17
+ "epoch": 166.67,
18
+ "eval_loss": 3.02618145942688,
19
+ "eval_runtime": 5.3514,
20
+ "eval_samples_per_second": 26.535,
21
+ "eval_steps_per_second": 3.364,
22
+ "eval_wer": 1.003487358326068,
23
+ "step": 500
24
+ },
25
+ {
26
+ "epoch": 333.33,
27
+ "learning_rate": 0.0001503,
28
+ "loss": 0.0572,
29
+ "step": 1000
30
+ },
31
+ {
32
+ "epoch": 333.33,
33
+ "eval_loss": 3.535200834274292,
34
+ "eval_runtime": 5.4028,
35
+ "eval_samples_per_second": 26.283,
36
+ "eval_steps_per_second": 3.332,
37
+ "eval_wer": 0.972101133391456,
38
+ "step": 1000
39
+ },
40
+ {
41
+ "epoch": 500.0,
42
+ "learning_rate": 7.529999999999999e-05,
43
+ "loss": 0.0209,
44
+ "step": 1500
45
+ },
46
+ {
47
+ "epoch": 500.0,
48
+ "eval_loss": 3.726599931716919,
49
+ "eval_runtime": 5.4408,
50
+ "eval_samples_per_second": 26.099,
51
+ "eval_steps_per_second": 3.308,
52
+ "eval_wer": 0.983435047951177,
53
+ "step": 1500
54
+ },
55
+ {
56
+ "epoch": 666.67,
57
+ "learning_rate": 3e-07,
58
+ "loss": 0.0092,
59
+ "step": 2000
60
+ },
61
+ {
62
+ "epoch": 666.67,
63
+ "eval_loss": 3.8433420658111572,
64
+ "eval_runtime": 5.3563,
65
+ "eval_samples_per_second": 26.511,
66
+ "eval_steps_per_second": 3.361,
67
+ "eval_wer": 0.985178727114211,
68
+ "step": 2000
69
+ },
70
+ {
71
+ "epoch": 666.67,
72
+ "step": 2000,
73
+ "total_flos": 5.0698303474476155e+19,
74
+ "train_loss": 0.3888468391895294,
75
+ "train_runtime": 14986.9731,
76
+ "train_samples_per_second": 17.082,
77
+ "train_steps_per_second": 0.133
78
+ }
79
+ ],
80
+ "max_steps": 2000,
81
+ "num_train_epochs": 667,
82
+ "total_flos": 5.0698303474476155e+19,
83
+ "trial_name": null,
84
+ "trial_params": null
85
+ }