Training in progress, step 13
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +27 -3
- pytorch_model.bin +1 -1
- runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1044539653
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c7a59da2efa72379bcc54eca155c61485a34016dc472390837f7e6667e1f381
|
3 |
size 1044539653
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5018531153
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
|
3 |
size 5018531153
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:512f018b467c169e2aa0e142ea191b73786d79604dace238e3d4834d1df266e8
|
3 |
size 14575
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ecb4b4bc15e0509048b47d006eba35fc56dec209d6d90c42b552a5ead63d9d9
|
3 |
size 557
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ce2185c6877d072e8ca86c937358d8e8317963d32ce90379cdc35bd6460cdf
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -60,11 +60,35 @@
|
|
60 |
"learning_rate": 0.0002,
|
61 |
"loss": 1.1174,
|
62 |
"step": 9
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
63 |
}
|
64 |
],
|
65 |
"max_steps": 500,
|
66 |
"num_train_epochs": 125,
|
67 |
-
"total_flos":
|
68 |
"trial_name": null,
|
69 |
"trial_params": null
|
70 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.25,
|
5 |
+
"global_step": 13,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
60 |
"learning_rate": 0.0002,
|
61 |
"loss": 1.1174,
|
62 |
"step": 9
|
63 |
+
},
|
64 |
+
{
|
65 |
+
"epoch": 2.5,
|
66 |
+
"learning_rate": 0.0002,
|
67 |
+
"loss": 0.9802,
|
68 |
+
"step": 10
|
69 |
+
},
|
70 |
+
{
|
71 |
+
"epoch": 2.75,
|
72 |
+
"learning_rate": 0.0002,
|
73 |
+
"loss": 0.8965,
|
74 |
+
"step": 11
|
75 |
+
},
|
76 |
+
{
|
77 |
+
"epoch": 3.0,
|
78 |
+
"learning_rate": 0.0002,
|
79 |
+
"loss": 0.7951,
|
80 |
+
"step": 12
|
81 |
+
},
|
82 |
+
{
|
83 |
+
"epoch": 3.25,
|
84 |
+
"learning_rate": 0.0002,
|
85 |
+
"loss": 0.6422,
|
86 |
+
"step": 13
|
87 |
}
|
88 |
],
|
89 |
"max_steps": 500,
|
90 |
"num_train_epochs": 125,
|
91 |
+
"total_flos": 2168782279802880.0,
|
92 |
"trial_name": null,
|
93 |
"trial_params": null
|
94 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5018531153
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c1829e1d9fe90b41ecbfccc04d70f06a21fb290a57b54fa1d7cdb906bac3a50
|
3 |
size 5018531153
|
runs/Jul19_18-03-38_47ad500bc002/events.out.tfevents.1689789837.47ad500bc002.2216.8
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20ae9a3f24920171c22cccb9e05be58bfecabaa437ec9df242a7dd0a1a1bd2bf
|
3 |
+
size 6522
|