pierreguillou
committed on
Commit
•
0c89138
1
Parent(s):
0539d8f
Training in progress, step 6000
Browse files
- checkpoint-5400/README.md +0 -1
- {checkpoint-5200 → checkpoint-6000}/config.json +0 -0
- {checkpoint-5200 → checkpoint-6000}/optimizer.pt +1 -1
- {checkpoint-5200 → checkpoint-6000}/pytorch_model.bin +1 -1
- {checkpoint-5200 → checkpoint-6000}/rng_state.pth +1 -1
- {checkpoint-5200 → checkpoint-6000}/scaler.pt +1 -1
- {checkpoint-5200 → checkpoint-6000}/scheduler.pt +1 -1
- {checkpoint-5200 → checkpoint-6000}/sentencepiece.bpe.model +0 -0
- {checkpoint-5200 → checkpoint-6000}/special_tokens_map.json +0 -0
- {checkpoint-5200 → checkpoint-6000}/tokenizer_config.json +0 -0
- {checkpoint-5200 → checkpoint-6000}/trainer_state.json +65 -5
- {checkpoint-5200 → checkpoint-6000}/training_args.bin +1 -1
- pytorch_model.bin +1 -1
- runs/Mar26_08-28-55_341d465657da/events.out.tfevents.1679821115.341d465657da.354.0 +2 -2
checkpoint-5400/README.md
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
f
|
|
|
|
{checkpoint-5200 → checkpoint-6000}/config.json
RENAMED
File without changes
|
{checkpoint-5200 → checkpoint-6000}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2927175013
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1461af1383bb2f63178874b44f042d449b81897e7e55e115154159da8fe49d56
|
3 |
size 2927175013
|
{checkpoint-5200 → checkpoint-6000}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1476527911
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88cf27c21e554578aa6ccc748e607c2e4642f451fa3d2246a9e54c2d740341d3
|
3 |
size 1476527911
|
{checkpoint-5200 → checkpoint-6000}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1dc0de1166af5138e7a8dee1ba212ea993dd8c57ea7c384a4e7dad81ded17ab1
|
3 |
size 14503
|
{checkpoint-5200 → checkpoint-6000}/scaler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 559
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:364aa966969e49bae3723e343aeb08c25d2b519d0a8d04a53a5262a8185d27ec
|
3 |
size 559
|
{checkpoint-5200 → checkpoint-6000}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d9661d23dc74e4d49d288ff40d04214542698769dd49c49616494083a0e77bd
|
3 |
size 623
|
{checkpoint-5200 → checkpoint-6000}/sentencepiece.bpe.model
RENAMED
File without changes
|
{checkpoint-5200 → checkpoint-6000}/special_tokens_map.json
RENAMED
File without changes
|
{checkpoint-5200 → checkpoint-6000}/tokenizer_config.json
RENAMED
File without changes
|
{checkpoint-5200 → checkpoint-6000}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "DocLayNet/layout-xlm-base-finetuned-DocLayNet-base_paragraphs_ml512-v6/checkpoint-
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -378,11 +378,71 @@
|
|
378 |
"eval_samples_per_second": 5.303,
|
379 |
"eval_steps_per_second": 0.333,
|
380 |
"step": 5200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
381 |
}
|
382 |
],
|
383 |
"max_steps": 7504,
|
384 |
"num_train_epochs": 4,
|
385 |
-
"total_flos": 2.
|
386 |
"trial_name": null,
|
387 |
"trial_params": null
|
388 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.7797986932721173,
|
3 |
+
"best_model_checkpoint": "DocLayNet/layout-xlm-base-finetuned-DocLayNet-base_paragraphs_ml512-v6/checkpoint-6000",
|
4 |
+
"epoch": 3.1982942430703627,
|
5 |
+
"global_step": 6000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
378 |
"eval_samples_per_second": 5.303,
|
379 |
"eval_steps_per_second": 0.333,
|
380 |
"step": 5200
|
381 |
+
},
|
382 |
+
{
|
383 |
+
"epoch": 2.88,
|
384 |
+
"eval_accuracy": 0.9724974065363203,
|
385 |
+
"eval_f1": 0.7607919220424181,
|
386 |
+
"eval_loss": 0.12770096957683563,
|
387 |
+
"eval_precision": 0.7864891968274227,
|
388 |
+
"eval_recall": 0.7367207514944492,
|
389 |
+
"eval_runtime": 298.6206,
|
390 |
+
"eval_samples_per_second": 5.381,
|
391 |
+
"eval_steps_per_second": 0.338,
|
392 |
+
"step": 5400
|
393 |
+
},
|
394 |
+
{
|
395 |
+
"epoch": 2.93,
|
396 |
+
"learning_rate": 5.955871464534282e-06,
|
397 |
+
"loss": 0.0432,
|
398 |
+
"step": 5500
|
399 |
+
},
|
400 |
+
{
|
401 |
+
"epoch": 2.99,
|
402 |
+
"eval_accuracy": 0.9692585465516832,
|
403 |
+
"eval_f1": 0.7784317119612255,
|
404 |
+
"eval_loss": 0.15319885313510895,
|
405 |
+
"eval_precision": 0.78908580452711,
|
406 |
+
"eval_recall": 0.7680614859094791,
|
407 |
+
"eval_runtime": 299.3727,
|
408 |
+
"eval_samples_per_second": 5.368,
|
409 |
+
"eval_steps_per_second": 0.337,
|
410 |
+
"step": 5600
|
411 |
+
},
|
412 |
+
{
|
413 |
+
"epoch": 3.09,
|
414 |
+
"eval_accuracy": 0.9691767171633182,
|
415 |
+
"eval_f1": 0.7783425414364641,
|
416 |
+
"eval_loss": 0.1701451987028122,
|
417 |
+
"eval_precision": 0.8066880439761795,
|
418 |
+
"eval_recall": 0.7519214346712212,
|
419 |
+
"eval_runtime": 330.9586,
|
420 |
+
"eval_samples_per_second": 4.856,
|
421 |
+
"eval_steps_per_second": 0.305,
|
422 |
+
"step": 5800
|
423 |
+
},
|
424 |
+
{
|
425 |
+
"epoch": 3.2,
|
426 |
+
"learning_rate": 4.475048126758478e-06,
|
427 |
+
"loss": 0.0272,
|
428 |
+
"step": 6000
|
429 |
+
},
|
430 |
+
{
|
431 |
+
"epoch": 3.2,
|
432 |
+
"eval_accuracy": 0.973239150346983,
|
433 |
+
"eval_f1": 0.7797986932721173,
|
434 |
+
"eval_loss": 0.11586667597293854,
|
435 |
+
"eval_precision": 0.8071650520928533,
|
436 |
+
"eval_recall": 0.7542271562766866,
|
437 |
+
"eval_runtime": 326.8152,
|
438 |
+
"eval_samples_per_second": 4.917,
|
439 |
+
"eval_steps_per_second": 0.309,
|
440 |
+
"step": 6000
|
441 |
}
|
442 |
],
|
443 |
"max_steps": 7504,
|
444 |
"num_train_epochs": 4,
|
445 |
+
"total_flos": 2.5913706725376e+16,
|
446 |
"trial_name": null,
|
447 |
"trial_params": null
|
448 |
}
|
{checkpoint-5200 → checkpoint-6000}/training_args.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3759
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa15259c372902c8706d91a1e90c5ae1b05ee943ad6d35334cb341cb0ae39556
|
3 |
size 3759
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1476527911
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88cf27c21e554578aa6ccc748e607c2e4642f451fa3d2246a9e54c2d740341d3
|
3 |
size 1476527911
|
runs/Mar26_08-28-55_341d465657da/events.out.tfevents.1679821115.341d465657da.354.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eba717486f41fecfab0ea997df086b866e05150e97b355db02590933316c1c64
|
3 |
+
size 7832
|