Training in progress, step 100
Browse files- all_results.json +14 -0
- config.json +0 -1
- eval_results.json +9 -0
- model.safetensors +1 -1
- runs/Mar26_14-58-24_ryanserver/events.out.tfevents.1711479509.ryanserver.32336.0 +2 -2
- runs/Mar26_19-10-31_ryanserver/events.out.tfevents.1711494636.ryanserver.23284.0 +3 -0
- runs/Mar26_19-10-31_ryanserver/events.out.tfevents.1711494727.ryanserver.23284.1 +3 -0
- runs/Mar26_19-25-15_ryanserver/events.out.tfevents.1711495521.ryanserver.25139.0 +3 -0
- runs/Mar26_19-28-27_ryanserver/events.out.tfevents.1711495712.ryanserver.25639.0 +3 -0
- runs/Mar26_19-31-04_ryanserver/events.out.tfevents.1711495870.ryanserver.26081.0 +3 -0
- runs/Mar26_19-32-15_ryanserver/events.out.tfevents.1711495940.ryanserver.26465.0 +3 -0
- runs/Mar26_19-33-53_ryanserver/events.out.tfevents.1711496039.ryanserver.26772.0 +3 -0
- runs/Mar26_19-33-53_ryanserver/events.out.tfevents.1711496133.ryanserver.26772.1 +3 -0
- runs/Mar26_19-36-12_ryanserver/events.out.tfevents.1711496178.ryanserver.27395.0 +3 -0
- runs/Mar26_19-37-43_ryanserver/events.out.tfevents.1711496268.ryanserver.27980.0 +3 -0
- runs/Mar26_19-37-43_ryanserver/events.out.tfevents.1711496360.ryanserver.27980.1 +3 -0
- runs/Mar26_19-43-54_ryanserver/events.out.tfevents.1711496640.ryanserver.29072.0 +3 -0
- runs/Mar26_19-46-27_ryanserver/events.out.tfevents.1711496793.ryanserver.29921.0 +3 -0
- train_results.json +7 -0
- trainer_state.json +72 -0
- training_args.bin +1 -1
all_results.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 4.0,
|
3 |
+
"eval_accuracy": 0.628,
|
4 |
+
"eval_loss": 0.29625898599624634,
|
5 |
+
"eval_na_accuracy": 0.952,
|
6 |
+
"eval_ordinal_accuracy": 0.5119617224880383,
|
7 |
+
"eval_runtime": 23.9544,
|
8 |
+
"eval_samples_per_second": 10.437,
|
9 |
+
"eval_steps_per_second": 1.336,
|
10 |
+
"train_loss": 0.2629110822454095,
|
11 |
+
"train_runtime": 64.8307,
|
12 |
+
"train_samples_per_second": 15.425,
|
13 |
+
"train_steps_per_second": 0.987
|
14 |
+
}
|
config.json
CHANGED
@@ -33,7 +33,6 @@
|
|
33 |
"num_channels": 3,
|
34 |
"num_hidden_layers": 12,
|
35 |
"patch_size": 16,
|
36 |
-
"problem_type": "single_label_classification",
|
37 |
"qkv_bias": true,
|
38 |
"torch_dtype": "float32",
|
39 |
"transformers_version": "4.39.1"
|
|
|
33 |
"num_channels": 3,
|
34 |
"num_hidden_layers": 12,
|
35 |
"patch_size": 16,
|
|
|
36 |
"qkv_bias": true,
|
37 |
"torch_dtype": "float32",
|
38 |
"transformers_version": "4.39.1"
|
eval_results.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 4.0,
|
3 |
+
"eval_loss": 0.29625898599624634,
|
4 |
+
"eval_na_accuracy": 0.952,
|
5 |
+
"eval_ordinal_accuracy": 0.5119617224880383,
|
6 |
+
"eval_runtime": 23.9544,
|
7 |
+
"eval_samples_per_second": 10.437,
|
8 |
+
"eval_steps_per_second": 1.336
|
9 |
+
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 343236280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf2a83d4c2644656305ccfed5a16acb6df1a780913707576cf644f8b5d572f9c
|
3 |
size 343236280
|
runs/Mar26_14-58-24_ryanserver/events.out.tfevents.1711479509.ryanserver.32336.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec4d0102002d51eda240637a797f0a719ad52c709701cac1570766fb4d2579c3
|
3 |
+
size 62332
|
runs/Mar26_19-10-31_ryanserver/events.out.tfevents.1711494636.ryanserver.23284.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b82328efd0105e79552c132bf8bad5be051abc122a6e1ec34f6131ff28775b3
|
3 |
+
size 6330
|
runs/Mar26_19-10-31_ryanserver/events.out.tfevents.1711494727.ryanserver.23284.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f0444e685ec2085c37c89b39baa78d0b801c510a0db15c413579935fb412308
|
3 |
+
size 405
|
runs/Mar26_19-25-15_ryanserver/events.out.tfevents.1711495521.ryanserver.25139.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:493797501022b6f85e8a6b06948937e985d47d79b3c26402a8296e296cb963de
|
3 |
+
size 4740
|
runs/Mar26_19-28-27_ryanserver/events.out.tfevents.1711495712.ryanserver.25639.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42021a17c5908eba1ec4fce7c4ffbf72d8ac879ac50942749c1b025c4cf82c58
|
3 |
+
size 4740
|
runs/Mar26_19-31-04_ryanserver/events.out.tfevents.1711495870.ryanserver.26081.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2221f13b60df622c59e3e32eb10577023a8031184cfd40fdf91743c67324b3b
|
3 |
+
size 4740
|
runs/Mar26_19-32-15_ryanserver/events.out.tfevents.1711495940.ryanserver.26465.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20790bd1a99748a795b63502ab796ef664bccba4e042fdf76342204f77db6119
|
3 |
+
size 4740
|
runs/Mar26_19-33-53_ryanserver/events.out.tfevents.1711496039.ryanserver.26772.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00d742c55b1f589100044e29ca10f17d462e8e10b9ae20e8323c8441e06d3239
|
3 |
+
size 6330
|
runs/Mar26_19-33-53_ryanserver/events.out.tfevents.1711496133.ryanserver.26772.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:624c69bda61ee7fa12011a7445ae3fc0267ada1e07d3013c347407efbe31b0a2
|
3 |
+
size 467
|
runs/Mar26_19-36-12_ryanserver/events.out.tfevents.1711496178.ryanserver.27395.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a00ca42036b5a2604a4754e4f6da268e05d1e6033dc97a0a428d3c0c1ae9c059
|
3 |
+
size 6330
|
runs/Mar26_19-37-43_ryanserver/events.out.tfevents.1711496268.ryanserver.27980.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86d5d17cf9e8c478c18c12a457b6db88b117a5d42b917cfe85833e44caea5511
|
3 |
+
size 6330
|
runs/Mar26_19-37-43_ryanserver/events.out.tfevents.1711496360.ryanserver.27980.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cea47e3ed4ab483c607ce165a2226c341591db85fbfc59376afd5e6a0a699f04
|
3 |
+
size 467
|
runs/Mar26_19-43-54_ryanserver/events.out.tfevents.1711496640.ryanserver.29072.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:533e4e07d40a966e3b74fe73bc9ce6bd642f516b4bc0ed42af0002d0e1c28b25
|
3 |
+
size 6809
|
runs/Mar26_19-46-27_ryanserver/events.out.tfevents.1711496793.ryanserver.29921.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d302da5e90bf108aced3d782e3aa4c7eef0cf1b857020f0639e645a7055a311d
|
3 |
+
size 7188
|
train_results.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"epoch": 4.0,
|
3 |
+
"train_loss": 0.2629110822454095,
|
4 |
+
"train_runtime": 64.8307,
|
5 |
+
"train_samples_per_second": 15.425,
|
6 |
+
"train_steps_per_second": 0.987
|
7 |
+
}
|
trainer_state.json
ADDED
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"best_metric": null,
|
3 |
+
"best_model_checkpoint": null,
|
4 |
+
"epoch": 4.0,
|
5 |
+
"eval_steps": 100,
|
6 |
+
"global_step": 64,
|
7 |
+
"is_hyper_param_search": false,
|
8 |
+
"is_local_process_zero": true,
|
9 |
+
"is_world_process_zero": true,
|
10 |
+
"log_history": [
|
11 |
+
{
|
12 |
+
"epoch": 0.62,
|
13 |
+
"grad_norm": 1.1892509460449219,
|
14 |
+
"learning_rate": 0.00016875,
|
15 |
+
"loss": 0.5447,
|
16 |
+
"step": 10
|
17 |
+
},
|
18 |
+
{
|
19 |
+
"epoch": 1.25,
|
20 |
+
"grad_norm": 1.315897822380066,
|
21 |
+
"learning_rate": 0.0001375,
|
22 |
+
"loss": 0.408,
|
23 |
+
"step": 20
|
24 |
+
},
|
25 |
+
{
|
26 |
+
"epoch": 1.88,
|
27 |
+
"grad_norm": 0.7632724046707153,
|
28 |
+
"learning_rate": 0.00010625000000000001,
|
29 |
+
"loss": 0.2444,
|
30 |
+
"step": 30
|
31 |
+
},
|
32 |
+
{
|
33 |
+
"epoch": 2.5,
|
34 |
+
"grad_norm": 0.5031312704086304,
|
35 |
+
"learning_rate": 7.500000000000001e-05,
|
36 |
+
"loss": 0.1791,
|
37 |
+
"step": 40
|
38 |
+
},
|
39 |
+
{
|
40 |
+
"epoch": 3.12,
|
41 |
+
"grad_norm": 0.6666581630706787,
|
42 |
+
"learning_rate": 4.375e-05,
|
43 |
+
"loss": 0.1459,
|
44 |
+
"step": 50
|
45 |
+
},
|
46 |
+
{
|
47 |
+
"epoch": 3.75,
|
48 |
+
"grad_norm": 0.8803956508636475,
|
49 |
+
"learning_rate": 1.25e-05,
|
50 |
+
"loss": 0.1187,
|
51 |
+
"step": 60
|
52 |
+
},
|
53 |
+
{
|
54 |
+
"epoch": 4.0,
|
55 |
+
"step": 64,
|
56 |
+
"total_flos": 7.749476775936e+16,
|
57 |
+
"train_loss": 0.2629110822454095,
|
58 |
+
"train_runtime": 64.8307,
|
59 |
+
"train_samples_per_second": 15.425,
|
60 |
+
"train_steps_per_second": 0.987
|
61 |
+
}
|
62 |
+
],
|
63 |
+
"logging_steps": 10,
|
64 |
+
"max_steps": 64,
|
65 |
+
"num_input_tokens_seen": 0,
|
66 |
+
"num_train_epochs": 4,
|
67 |
+
"save_steps": 100,
|
68 |
+
"total_flos": 7.749476775936e+16,
|
69 |
+
"train_batch_size": 16,
|
70 |
+
"trial_name": null,
|
71 |
+
"trial_params": null
|
72 |
+
}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4920
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59b0fd0e128bbccad6b3cb1d0e6ce51a75d3a5b66f1899015838ed631f927eee
|
3 |
size 4920
|