Training in progress, epoch 6
Browse files
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29835597
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fb3d8a1853e13390a98cd166d2bc6fd6a4717b89fc6bec01ffac915b9e9a1b5
|
3 |
size 29835597
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14929953
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:567ae17da0df69e4df668d4830ffc23cb2af18380f5ba3828cf1fbda5bf864ed
|
3 |
size 14929953
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f3bf7904e607c5dfb520da7105305892edb040d8a8e1c00a1f80d7f74d2088
|
3 |
+
size 14631
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b1c8714dde8960a024761c760981e691e4e3f2fad0d6176179cb6463509d73a
|
3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -36,11 +36,17 @@
|
|
36 |
"learning_rate": 3.5000000000000004e-05,
|
37 |
"loss": 0.0168,
|
38 |
"step": 1700
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
}
|
40 |
],
|
41 |
"max_steps": 4080,
|
42 |
"num_train_epochs": 12,
|
43 |
-
"total_flos":
|
44 |
"trial_name": null,
|
45 |
"trial_params": null
|
46 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 6.0,
|
5 |
+
"global_step": 2040,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
36 |
"learning_rate": 3.5000000000000004e-05,
|
37 |
"loss": 0.0168,
|
38 |
"step": 1700
|
39 |
+
},
|
40 |
+
{
|
41 |
+
"epoch": 6.0,
|
42 |
+
"learning_rate": 3e-05,
|
43 |
+
"loss": 0.0159,
|
44 |
+
"step": 2040
|
45 |
}
|
46 |
],
|
47 |
"max_steps": 4080,
|
48 |
"num_train_epochs": 12,
|
49 |
+
"total_flos": 8.576428636687565e+17,
|
50 |
"trial_name": null,
|
51 |
"trial_params": null
|
52 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14929953
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:567ae17da0df69e4df668d4830ffc23cb2af18380f5ba3828cf1fbda5bf864ed
|
3 |
size 14929953
|
runs/Aug01_18-12-22_8ec249145423/events.out.tfevents.1659377547.8ec249145423.72.2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3859222a41e6fcdba312f8001a8fb0bfaa15a3537fe6aa7f5431e267490877b
|
3 |
+
size 5194
|