k4black commited on
Commit
35cb6bb
·
1 Parent(s): c067a76

Training in progress, step 14000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54eb609d9e7c9af8da5e499842252b44866540b8464e813675b437dafad687b2
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c23b69b59897ebc9a97c19bd2a902bb18a26d887e62ee33ac8b4f293e0af7d4
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30184e0248c24f3d379731864a3d98181dd0e082ff4728e8eb1473d646421010
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9495204942412434228c388914178dbe63163b5e4a568c01df18f671c0ee1d6e
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a75063c2eccccee16964972d0c16700ba598e8ad046be88de665bdc4e411e739
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e8f7efa9426f92d7539e42fac5262290109f255d1efd558300073dd9b1757e3
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0285090586e6ad2f57d9d2e587707107a6deb19c653c72063c13e57720ea6b1e
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcbebf584d95d5940548f6516feb8fd6cb40baa6100b67cbab5a1e566f16d2f1
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26b34eea6aaf93230bd2195d19b94a8c538e2fb1720b246af9cbe4988634461c
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e42904a0588b80a1634b5dc0bcc0efd6bdf97c38cd332e0d2726fb589ae18ccb
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 1.528552770614624,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship-repr/results/Salesforce-codet5-small-java-small-selected-wo-tokens/checkpoint-2000",
4
- "epoch": 1.6645859342488556,
5
- "global_step": 12000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -114,11 +114,29 @@
114
  "eval_samples_per_second": 144.961,
115
  "eval_steps_per_second": 1.514,
116
  "step": 12000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
117
  }
118
  ],
119
  "max_steps": 36045,
120
  "num_train_epochs": 5,
121
- "total_flos": 1.5590157453361152e+17,
122
  "trial_name": null,
123
  "trial_params": null
124
  }
 
1
  {
2
  "best_metric": 1.528552770614624,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship-repr/results/Salesforce-codet5-small-java-small-selected-wo-tokens/checkpoint-2000",
4
+ "epoch": 1.9420169232903315,
5
+ "global_step": 14000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
114
  "eval_samples_per_second": 144.961,
115
  "eval_steps_per_second": 1.514,
116
  "step": 12000
117
+ },
118
+ {
119
+ "epoch": 1.94,
120
+ "learning_rate": 6.440044389930495e-05,
121
+ "loss": 1.0027,
122
+ "step": 14000
123
+ },
124
+ {
125
+ "epoch": 1.94,
126
+ "eval_exact_match": 0.3238550578761953,
127
+ "eval_loss": 1.5750421285629272,
128
+ "eval_rouge1": 0.5206336041126007,
129
+ "eval_rouge2": 0.24470678869584325,
130
+ "eval_rougeL": 0.5202257107678057,
131
+ "eval_runtime": 161.6161,
132
+ "eval_samples_per_second": 147.535,
133
+ "eval_steps_per_second": 1.541,
134
+ "step": 14000
135
  }
136
  ],
137
  "max_steps": 36045,
138
  "num_train_epochs": 5,
139
+ "total_flos": 1.8188720041623552e+17,
140
  "trial_name": null,
141
  "trial_params": null
142
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30184e0248c24f3d379731864a3d98181dd0e082ff4728e8eb1473d646421010
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9495204942412434228c388914178dbe63163b5e4a568c01df18f671c0ee1d6e
3
  size 242019067