Training in progress, step 3000, checkpoint
Browse files- last-checkpoint/adapter_model.bin +1 -1
- last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_model_states.pt +3 -0
- last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- last-checkpoint/latest +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/trainer_state.json +11 -35
- last-checkpoint/training_args.bin +1 -1
last-checkpoint/adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2141578
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9046729082553bffbbf8d0e0cac1eada34c1cab928ee43f8c80538e282701a48
|
3 |
size 2141578
|
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a81b3f8494b418c7af73fb66455d6559d817413b09a91bbc8ff600f0570fb83
|
3 |
+
size 3369573916
|
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e11de63a25fa3e9fa32b351f1961e034af2f67c00d98a764314d24b0ca01c9e
|
3 |
+
size 3149677
|
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36f9db737adc99019fb2e6b70dc4829e420d9aa1205776e45fb618a7d0bee99d
|
3 |
+
size 3369573916
|
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59c4984809cb0aeefd87b81fa3c3b4c5737ff2d057a7fd7cdd794b17190cda0b
|
3 |
+
size 3149677
|
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c1188bb61cacb71a048ae120a0e4951777f2360e88c6d0389c5dc8048cfd476
|
3 |
+
size 3369573916
|
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13b24420253d948bfcd1065a8e0ca1027f1c092bbc44fe7904ac2acd42e7f69a
|
3 |
+
size 3149677
|
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6cd8a60749e85bfcc983fadc9c231a269ccfd246480852d2bb59492458dfe25
|
3 |
+
size 3369573916
|
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59c98cf53aa131276d29bfcca76d236299c36bcd35e812669e990bc57a4c153e
|
3 |
+
size 3149677
|
last-checkpoint/latest
CHANGED
@@ -1 +1 @@
|
|
1 |
-
|
|
|
1 |
+
global_step3000
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:075d19a98a161dd41b22953b88968106e072f65a707d53d0eba42094eb565ca0
|
3 |
size 15024
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08196a2ce29aaa623a1d33352a238026f278deee20c1aeafc729e6950f4d6f34
|
3 |
size 15024
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:864a0722927155f4e5989416d78f8a8d144c5a196f6850f853c9c218e30d7178
|
3 |
size 15024
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 15024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d5921de3329d7f101252046b392f3f099daa7f4bbee0195234f7c5c1f2469a2
|
3 |
size 15024
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,49 +1,25 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
"eval_steps": 500,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
-
"epoch":
|
13 |
-
"learning_rate": 0.
|
14 |
-
"loss": 0.
|
15 |
-
"step":
|
16 |
-
},
|
17 |
-
{
|
18 |
-
"epoch": 4.0,
|
19 |
-
"learning_rate": 0.01,
|
20 |
-
"loss": 0.1287,
|
21 |
-
"step": 1000
|
22 |
-
},
|
23 |
-
{
|
24 |
-
"epoch": 6.0,
|
25 |
-
"learning_rate": 0.01,
|
26 |
-
"loss": 0.1689,
|
27 |
-
"step": 1500
|
28 |
-
},
|
29 |
-
{
|
30 |
-
"epoch": 8.0,
|
31 |
-
"learning_rate": 0.01,
|
32 |
-
"loss": 0.1537,
|
33 |
-
"step": 2000
|
34 |
-
},
|
35 |
-
{
|
36 |
-
"epoch": 10.0,
|
37 |
-
"learning_rate": 0.01,
|
38 |
-
"loss": 0.1332,
|
39 |
-
"step": 2500
|
40 |
}
|
41 |
],
|
42 |
-
"logging_steps":
|
43 |
-
"max_steps":
|
44 |
-
"num_train_epochs":
|
45 |
-
"save_steps":
|
46 |
-
"total_flos":
|
47 |
"trial_name": null,
|
48 |
"trial_params": null
|
49 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 1.1727912431587177,
|
5 |
"eval_steps": 500,
|
6 |
+
"global_step": 3000,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
10 |
"log_history": [
|
11 |
{
|
12 |
+
"epoch": 1.17,
|
13 |
+
"learning_rate": 0.0001,
|
14 |
+
"loss": 0.204,
|
15 |
+
"step": 3000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
}
|
17 |
],
|
18 |
+
"logging_steps": 3000,
|
19 |
+
"max_steps": 12790,
|
20 |
+
"num_train_epochs": 5,
|
21 |
+
"save_steps": 3000,
|
22 |
+
"total_flos": 39574520725504.0,
|
23 |
"trial_name": null,
|
24 |
"trial_params": null
|
25 |
}
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdf6b5aa86c1d81710c05be6ff9474216751b563adb5d2a3249d44c9bf2f85ad
|
3 |
size 6840
|