k4black committed on
Commit
d086b6b
1 Parent(s): f1b41df

Training in progress, step 8500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbf659a65f9a3c6db040bf88bab53a10d9b0c46fa7280e3b67f9cb74a50e6d3d
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88af33fe8e5306f134e62bf5499f0af9d747c05e5dd3bfe70641a5940d6930a4
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d00b3065b12e27ae9840ccf4e5d5549aaf2f7220310032a5205f90a839065ebd
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0793531568d277d51ce2970f580cae65fe1987a03f245b5b066d6e471e20d87e
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cec724b38bb580d680c039595cf17594fa973d2ae47755369626c19343dda09e
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a51dfbb88117ab22e6f31437680c19642fbab7436c6ca33a16672c64603d2ff9
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb81c75ce18cfc01d028f80ff6cb28745bf4cddf3350cea7d001fea8d2e9bad8
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9bda0aecccd9852ee1800c4d934c39f500d5db7bc34a781b3fc35027e954f8f
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d31c06f4e8f4233900b921d54f3928d17e889534600ddff4a32c5a43a425dfa2
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:010a1b2faa827416c291882f77230dae20f61293663c7d0588d29cfa1fb72ab1
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 0.7643744945526123,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-8000",
4
- "epoch": 2.56,
5
- "global_step": 8000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -310,11 +310,30 @@
310
  "eval_samples_per_second": 91.671,
311
  "eval_steps_per_second": 2.888,
312
  "step": 8000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
313
  }
314
  ],
315
  "max_steps": 31250,
316
  "num_train_epochs": 10,
317
- "total_flos": 2.891269685850931e+16,
318
  "trial_name": null,
319
  "trial_params": null
320
  }
 
1
  {
2
  "best_metric": 0.7643744945526123,
3
  "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-8000",
4
+ "epoch": 2.7199999999999998,
5
+ "global_step": 8500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
310
  "eval_samples_per_second": 91.671,
311
  "eval_steps_per_second": 2.888,
312
  "step": 8000
313
+ },
314
+ {
315
+ "epoch": 2.72,
316
+ "learning_rate": 7.665308047293428e-05,
317
+ "loss": 0.5296,
318
+ "step": 8500
319
+ },
320
+ {
321
+ "epoch": 2.72,
322
+ "eval_bleu": 0.13382829744509098,
323
+ "eval_exact_match": 0.161,
324
+ "eval_loss": 0.7650749683380127,
325
+ "eval_rouge1": 0.5692675142813927,
326
+ "eval_rouge2": 0.4018288384287947,
327
+ "eval_rougeL": 0.5521131597944772,
328
+ "eval_runtime": 21.7709,
329
+ "eval_samples_per_second": 91.866,
330
+ "eval_steps_per_second": 2.894,
331
+ "step": 8500
332
  }
333
  ],
334
  "max_steps": 31250,
335
  "num_train_epochs": 10,
336
+ "total_flos": 3.0721979896037376e+16,
337
  "trial_name": null,
338
  "trial_params": null
339
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d00b3065b12e27ae9840ccf4e5d5549aaf2f7220310032a5205f90a839065ebd
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0793531568d277d51ce2970f580cae65fe1987a03f245b5b066d6e471e20d87e
3
  size 242019067