SuperSecureHuman
committed on
Commit
•
00879ce
1
Parent(s):
9305420
Training in progress, step 20
Browse files- {checkpoint-5 → checkpoint-10}/config.json +0 -0
- {checkpoint-5 → checkpoint-10}/optimizer.pt +1 -1
- {checkpoint-5 → checkpoint-10}/pytorch_model.bin +1 -1
- {checkpoint-5 → checkpoint-10}/rng_state.pth +1 -1
- {checkpoint-5 → checkpoint-10}/scheduler.pt +1 -1
- {checkpoint-5 → checkpoint-10}/trainer_state.json +14 -5
- {checkpoint-5 → checkpoint-10}/training_args.bin +0 -0
- checkpoint-15/config.json +41 -0
- checkpoint-15/optimizer.pt +3 -0
- checkpoint-15/pytorch_model.bin +3 -0
- checkpoint-15/rng_state.pth +3 -0
- checkpoint-15/scheduler.pt +3 -0
- checkpoint-15/trainer_state.json +43 -0
- checkpoint-15/training_args.bin +3 -0
- checkpoint-20/config.json +41 -0
- checkpoint-20/optimizer.pt +3 -0
- checkpoint-20/pytorch_model.bin +3 -0
- checkpoint-20/rng_state.pth +3 -0
- checkpoint-20/scheduler.pt +3 -0
- checkpoint-20/trainer_state.json +52 -0
- checkpoint-20/training_args.bin +3 -0
- pytorch_model.bin +1 -1
- runs/Aug01_08-59-35_bf9c8dab34e2/events.out.tfevents.1690880484.bf9c8dab34e2.4319.0 +2 -2
{checkpoint-5 → checkpoint-10}/config.json
RENAMED
File without changes
|
{checkpoint-5 → checkpoint-10}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 866630597
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5048ccd942c1fa8f84859abf13b3def087a58f67d403eb31ee5407850c2b73f0
|
3 |
size 866630597
|
{checkpoint-5 → checkpoint-10}/pytorch_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 433324849
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7663ee471abdc67aeda453f03e899ec561cb8b9163487ab6582d533f1aabe344
|
3 |
size 433324849
|
{checkpoint-5 → checkpoint-10}/rng_state.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19791385e49273a511907444b1ae61a0fb564d72d6c2f39e93faa8ba412a08bc
|
3 |
size 14575
|
{checkpoint-5 → checkpoint-10}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:300c86a2aa6e26efba7d9b0a68e362b00d4b32a365582d4ca0f1da2b053f668a
|
3 |
size 627
|
{checkpoint-5 → checkpoint-10}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 0.
|
3 |
-
"best_model_checkpoint": "./trainer_test_checkpoint/checkpoint-
|
4 |
-
"epoch": 0.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -15,11 +15,20 @@
|
|
15 |
"eval_samples_per_second": 28.444,
|
16 |
"eval_steps_per_second": 14.222,
|
17 |
"step": 5
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
18 |
}
|
19 |
],
|
20 |
"max_steps": 100,
|
21 |
"num_train_epochs": 2,
|
22 |
-
"total_flos":
|
23 |
"trial_name": null,
|
24 |
"trial_params": null
|
25 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 0.25,
|
3 |
+
"best_model_checkpoint": "./trainer_test_checkpoint/checkpoint-10",
|
4 |
+
"epoch": 0.2,
|
5 |
+
"global_step": 10,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
15 |
"eval_samples_per_second": 28.444,
|
16 |
"eval_steps_per_second": 14.222,
|
17 |
"step": 5
|
18 |
+
},
|
19 |
+
{
|
20 |
+
"epoch": 0.2,
|
21 |
+
"eval_accuracy": 0.25,
|
22 |
+
"eval_loss": 1.7874902486801147,
|
23 |
+
"eval_runtime": 3.5523,
|
24 |
+
"eval_samples_per_second": 28.15,
|
25 |
+
"eval_steps_per_second": 14.075,
|
26 |
+
"step": 10
|
27 |
}
|
28 |
],
|
29 |
"max_steps": 100,
|
30 |
"num_train_epochs": 2,
|
31 |
+
"total_flos": 5262362849280.0,
|
32 |
"trial_name": null,
|
33 |
"trial_params": null
|
34 |
}
|
{checkpoint-5 → checkpoint-10}/training_args.bin
RENAMED
File without changes
|
checkpoint-15/config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "bert-base-cased",
|
3 |
+
"architectures": [
|
4 |
+
"BertForSequenceClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"gradient_checkpointing": false,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"id2label": {
|
13 |
+
"0": "LABEL_0",
|
14 |
+
"1": "LABEL_1",
|
15 |
+
"2": "LABEL_2",
|
16 |
+
"3": "LABEL_3",
|
17 |
+
"4": "LABEL_4"
|
18 |
+
},
|
19 |
+
"initializer_range": 0.02,
|
20 |
+
"intermediate_size": 3072,
|
21 |
+
"label2id": {
|
22 |
+
"LABEL_0": 0,
|
23 |
+
"LABEL_1": 1,
|
24 |
+
"LABEL_2": 2,
|
25 |
+
"LABEL_3": 3,
|
26 |
+
"LABEL_4": 4
|
27 |
+
},
|
28 |
+
"layer_norm_eps": 1e-12,
|
29 |
+
"max_position_embeddings": 512,
|
30 |
+
"model_type": "bert",
|
31 |
+
"num_attention_heads": 12,
|
32 |
+
"num_hidden_layers": 12,
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"position_embedding_type": "absolute",
|
35 |
+
"problem_type": "single_label_classification",
|
36 |
+
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.31.0",
|
38 |
+
"type_vocab_size": 2,
|
39 |
+
"use_cache": true,
|
40 |
+
"vocab_size": 28996
|
41 |
+
}
|
checkpoint-15/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ba475c8d36049d825dc710ded8480d6d8fae3b32e0490f721ed506ed88a2da9
|
3 |
+
size 866630597
|
checkpoint-15/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73546efd274884c910649f24f056089ff97f31d0bf3f3b12ed86f615860f3ac8
|
3 |
+
size 433324849
|
checkpoint-15/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f76d54f18626b1e6a8c0c08bd80df27682d642ae62e823afbd857e1580073ffe
|
3 |
+
size 14575
|
checkpoint-15/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1342d5172800147e9ebe25b8a1c9f4694b69157df8117f38d3567999ad3a36e5
|
3 |
+
size 627
|
checkpoint-15/trainer_state.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.25,
|
3 |
+
"best_model_checkpoint": "./trainer_test_checkpoint/checkpoint-10",
|
4 |
+
"epoch": 0.3,
|
5 |
+
"global_step": 15,
|
6 |
+
"is_hyper_param_search": false,
|
7 |
+
"is_local_process_zero": true,
|
8 |
+
"is_world_process_zero": true,
|
9 |
+
"log_history": [
|
10 |
+
{
|
11 |
+
"epoch": 0.1,
|
12 |
+
"eval_accuracy": 0.17,
|
13 |
+
"eval_loss": 1.7631263732910156,
|
14 |
+
"eval_runtime": 3.5157,
|
15 |
+
"eval_samples_per_second": 28.444,
|
16 |
+
"eval_steps_per_second": 14.222,
|
17 |
+
"step": 5
|
18 |
+
},
|
19 |
+
{
|
20 |
+
"epoch": 0.2,
|
21 |
+
"eval_accuracy": 0.25,
|
22 |
+
"eval_loss": 1.7874902486801147,
|
23 |
+
"eval_runtime": 3.5523,
|
24 |
+
"eval_samples_per_second": 28.15,
|
25 |
+
"eval_steps_per_second": 14.075,
|
26 |
+
"step": 10
|
27 |
+
},
|
28 |
+
{
|
29 |
+
"epoch": 0.3,
|
30 |
+
"eval_accuracy": 0.2,
|
31 |
+
"eval_loss": 1.7714591026306152,
|
32 |
+
"eval_runtime": 5.4717,
|
33 |
+
"eval_samples_per_second": 18.276,
|
34 |
+
"eval_steps_per_second": 9.138,
|
35 |
+
"step": 15
|
36 |
+
}
|
37 |
+
],
|
38 |
+
"max_steps": 100,
|
39 |
+
"num_train_epochs": 2,
|
40 |
+
"total_flos": 7893544273920.0,
|
41 |
+
"trial_name": null,
|
42 |
+
"trial_params": null
|
43 |
+
}
|
checkpoint-15/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f994e774f37ded33f3ebe64d3be2318670c8aaf6b944d3b012a125b991f2869c
|
3 |
+
size 3963
|
checkpoint-20/config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "bert-base-cased",
|
3 |
+
"architectures": [
|
4 |
+
"BertForSequenceClassification"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"gradient_checkpointing": false,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"id2label": {
|
13 |
+
"0": "LABEL_0",
|
14 |
+
"1": "LABEL_1",
|
15 |
+
"2": "LABEL_2",
|
16 |
+
"3": "LABEL_3",
|
17 |
+
"4": "LABEL_4"
|
18 |
+
},
|
19 |
+
"initializer_range": 0.02,
|
20 |
+
"intermediate_size": 3072,
|
21 |
+
"label2id": {
|
22 |
+
"LABEL_0": 0,
|
23 |
+
"LABEL_1": 1,
|
24 |
+
"LABEL_2": 2,
|
25 |
+
"LABEL_3": 3,
|
26 |
+
"LABEL_4": 4
|
27 |
+
},
|
28 |
+
"layer_norm_eps": 1e-12,
|
29 |
+
"max_position_embeddings": 512,
|
30 |
+
"model_type": "bert",
|
31 |
+
"num_attention_heads": 12,
|
32 |
+
"num_hidden_layers": 12,
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"position_embedding_type": "absolute",
|
35 |
+
"problem_type": "single_label_classification",
|
36 |
+
"torch_dtype": "float32",
|
37 |
+
"transformers_version": "4.31.0",
|
38 |
+
"type_vocab_size": 2,
|
39 |
+
"use_cache": true,
|
40 |
+
"vocab_size": 28996
|
41 |
+
}
|
checkpoint-20/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b750a1285cf5d7330e810312588bf1673397d3409d08adf477c6d477a3f8648
|
3 |
+
size 866630597
|
checkpoint-20/pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0daebb71a520050584a0bd9e86481eb4fc646f7ea888e9af22035e1cca5702e6
|
3 |
+
size 433324849
|
checkpoint-20/rng_state.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c77f772a2ba9b5c0359e4c7dbaf1704b9f015e0cf13e2cc0d1557ec51f97467
|
3 |
+
size 14575
|
checkpoint-20/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee02d9816945c904e881ed0c62a97354f538c50c767dfe7cddb585bcb191b22d
|
3 |
+
size 627
|
checkpoint-20/trainer_state.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": 0.25,
|
3 |
+
"best_model_checkpoint": "./trainer_test_checkpoint/checkpoint-10",
|
4 |
+
"epoch": 0.4,
|
5 |
+
"global_step": 20,
|
6 |
+
"is_hyper_param_search": false,
|
7 |
+
"is_local_process_zero": true,
|
8 |
+
"is_world_process_zero": true,
|
9 |
+
"log_history": [
|
10 |
+
{
|
11 |
+
"epoch": 0.1,
|
12 |
+
"eval_accuracy": 0.17,
|
13 |
+
"eval_loss": 1.7631263732910156,
|
14 |
+
"eval_runtime": 3.5157,
|
15 |
+
"eval_samples_per_second": 28.444,
|
16 |
+
"eval_steps_per_second": 14.222,
|
17 |
+
"step": 5
|
18 |
+
},
|
19 |
+
{
|
20 |
+
"epoch": 0.2,
|
21 |
+
"eval_accuracy": 0.25,
|
22 |
+
"eval_loss": 1.7874902486801147,
|
23 |
+
"eval_runtime": 3.5523,
|
24 |
+
"eval_samples_per_second": 28.15,
|
25 |
+
"eval_steps_per_second": 14.075,
|
26 |
+
"step": 10
|
27 |
+
},
|
28 |
+
{
|
29 |
+
"epoch": 0.3,
|
30 |
+
"eval_accuracy": 0.2,
|
31 |
+
"eval_loss": 1.7714591026306152,
|
32 |
+
"eval_runtime": 5.4717,
|
33 |
+
"eval_samples_per_second": 18.276,
|
34 |
+
"eval_steps_per_second": 9.138,
|
35 |
+
"step": 15
|
36 |
+
},
|
37 |
+
{
|
38 |
+
"epoch": 0.4,
|
39 |
+
"eval_accuracy": 0.2,
|
40 |
+
"eval_loss": 1.7414228916168213,
|
41 |
+
"eval_runtime": 3.5124,
|
42 |
+
"eval_samples_per_second": 28.47,
|
43 |
+
"eval_steps_per_second": 14.235,
|
44 |
+
"step": 20
|
45 |
+
}
|
46 |
+
],
|
47 |
+
"max_steps": 100,
|
48 |
+
"num_train_epochs": 2,
|
49 |
+
"total_flos": 10524725698560.0,
|
50 |
+
"trial_name": null,
|
51 |
+
"trial_params": null
|
52 |
+
}
|
checkpoint-20/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f994e774f37ded33f3ebe64d3be2318670c8aaf6b944d3b012a125b991f2869c
|
3 |
+
size 3963
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 433324849
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0daebb71a520050584a0bd9e86481eb4fc646f7ea888e9af22035e1cca5702e6
|
3 |
size 433324849
|
runs/Aug01_08-59-35_bf9c8dab34e2/events.out.tfevents.1690880484.bf9c8dab34e2.4319.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d603590c421b8ccf248f628cbf3f8941e0e00bc2543c3ef99689d9fdb6289aea
|
3 |
+
size 5564
|