k4black commited on
Commit
1a906dd
1 Parent(s): d086b6b

Training in progress, step 9000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88af33fe8e5306f134e62bf5499f0af9d747c05e5dd3bfe70641a5940d6930a4
3
  size 484059375
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00f371231c36791b38dd89092a64e366dd58b671d444922dde4998574869274a
3
  size 484059375
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0793531568d277d51ce2970f580cae65fe1987a03f245b5b066d6e471e20d87e
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f18937662a859ff6e78c5422df2113b523dbfd7b7f91be18cb13250063a5e03
3
  size 242019067
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a51dfbb88117ab22e6f31437680c19642fbab7436c6ca33a16672c64603d2ff9
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd9dfd2b668d498514c4957117c1d874e1ccc4cc4890ffb1a77585c12f80cd8e
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9bda0aecccd9852ee1800c4d934c39f500d5db7bc34a781b3fc35027e954f8f
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83908742b3f4513cfd0e74b4f711b13f11ccb972c2d6ebf61778d4a4d13e30eb
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:010a1b2faa827416c291882f77230dae20f61293663c7d0588d29cfa1fb72ab1
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b76fe3f533d8bee2b12633a432289bbe1cbc4f2c09860cdf067c3155a68af8bf
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7643744945526123,
3
- "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-8000",
4
- "epoch": 2.7199999999999998,
5
- "global_step": 8500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -329,11 +329,30 @@
329
  "eval_samples_per_second": 91.866,
330
  "eval_steps_per_second": 2.894,
331
  "step": 8500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
332
  }
333
  ],
334
  "max_steps": 31250,
335
  "num_train_epochs": 10,
336
- "total_flos": 3.0721979896037376e+16,
337
  "trial_name": null,
338
  "trial_params": null
339
  }
 
1
  {
2
+ "best_metric": 0.7636184096336365,
3
+ "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-9000",
4
+ "epoch": 2.88,
5
+ "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
329
  "eval_samples_per_second": 91.866,
330
  "eval_steps_per_second": 2.894,
331
  "step": 8500
332
+ },
333
+ {
334
+ "epoch": 2.88,
335
+ "learning_rate": 7.496884158048978e-05,
336
+ "loss": 0.5343,
337
+ "step": 9000
338
+ },
339
+ {
340
+ "epoch": 2.88,
341
+ "eval_bleu": 0.1355027033693307,
342
+ "eval_exact_match": 0.1635,
343
+ "eval_loss": 0.7636184096336365,
344
+ "eval_rouge1": 0.5679441721859034,
345
+ "eval_rouge2": 0.4050592356179844,
346
+ "eval_rougeL": 0.5514489474326643,
347
+ "eval_runtime": 21.8929,
348
+ "eval_samples_per_second": 91.354,
349
+ "eval_steps_per_second": 2.878,
350
+ "step": 9000
351
  }
352
  ],
353
  "max_steps": 31250,
354
  "num_train_epochs": 10,
355
+ "total_flos": 3.251577475615949e+16,
356
  "trial_name": null,
357
  "trial_params": null
358
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0793531568d277d51ce2970f580cae65fe1987a03f245b5b066d6e471e20d87e
3
  size 242019067
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f18937662a859ff6e78c5422df2113b523dbfd7b7f91be18cb13250063a5e03
3
  size 242019067