naman1011 committed on
Commit
9fc1d56
1 Parent(s): cfc245c

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7328d3c4c1f327c39e82a120e4c4a584216b22fac4f3446fd72c1dcb57e70f32
3
  size 2141578
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9046729082553bffbbf8d0e0cac1eada34c1cab928ee43f8c80538e282701a48
3
  size 2141578
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a81b3f8494b418c7af73fb66455d6559d817413b09a91bbc8ff600f0570fb83
3
+ size 3369573916
last-checkpoint/global_step3000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e11de63a25fa3e9fa32b351f1961e034af2f67c00d98a764314d24b0ca01c9e
3
+ size 3149677
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36f9db737adc99019fb2e6b70dc4829e420d9aa1205776e45fb618a7d0bee99d
3
+ size 3369573916
last-checkpoint/global_step3000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59c4984809cb0aeefd87b81fa3c3b4c5737ff2d057a7fd7cdd794b17190cda0b
3
+ size 3149677
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c1188bb61cacb71a048ae120a0e4951777f2360e88c6d0389c5dc8048cfd476
3
+ size 3369573916
last-checkpoint/global_step3000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13b24420253d948bfcd1065a8e0ca1027f1c092bbc44fe7904ac2acd42e7f69a
3
+ size 3149677
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6cd8a60749e85bfcc983fadc9c231a269ccfd246480852d2bb59492458dfe25
3
+ size 3369573916
last-checkpoint/global_step3000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59c98cf53aa131276d29bfcca76d236299c36bcd35e812669e990bc57a4c153e
3
+ size 3149677
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step2500
 
1
+ global_step3000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70b1fee1a60477fdfb37fe442104a5be1d94b9aa2faa90b681407bb84aa0b5b6
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075d19a98a161dd41b22953b88968106e072f65a707d53d0eba42094eb565ca0
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d58ce42605b8fed10a20d163f8befeb1455bc204e34fdb098df937a29c667f0f
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08196a2ce29aaa623a1d33352a238026f278deee20c1aeafc729e6950f4d6f34
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0469f49ee1a31e6c95bee835b8fd70a89c1c7492a85f2a3e27479d0023352b45
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:864a0722927155f4e5989416d78f8a8d144c5a196f6850f853c9c218e30d7178
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60b3ac292cfaee329c617a744e6a245f290a629973a48a421885f424abc14c41
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d5921de3329d7f101252046b392f3f099daa7f4bbee0195234f7c5c1f2469a2
3
  size 15024
last-checkpoint/trainer_state.json CHANGED
@@ -1,49 +1,25 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
  "eval_steps": 500,
6
- "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 2.0,
13
- "learning_rate": 0.01,
14
- "loss": 0.6125,
15
- "step": 500
16
- },
17
- {
18
- "epoch": 4.0,
19
- "learning_rate": 0.01,
20
- "loss": 0.1287,
21
- "step": 1000
22
- },
23
- {
24
- "epoch": 6.0,
25
- "learning_rate": 0.01,
26
- "loss": 0.1689,
27
- "step": 1500
28
- },
29
- {
30
- "epoch": 8.0,
31
- "learning_rate": 0.01,
32
- "loss": 0.1537,
33
- "step": 2000
34
- },
35
- {
36
- "epoch": 10.0,
37
- "learning_rate": 0.01,
38
- "loss": 0.1332,
39
- "step": 2500
40
  }
41
  ],
42
- "logging_steps": 500,
43
- "max_steps": 2500,
44
- "num_train_epochs": 10,
45
- "save_steps": 500,
46
- "total_flos": 422580387840.0,
47
  "trial_name": null,
48
  "trial_params": null
49
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.1727912431587177,
5
  "eval_steps": 500,
6
+ "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 1.17,
13
+ "learning_rate": 0.0001,
14
+ "loss": 0.204,
15
+ "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  }
17
  ],
18
+ "logging_steps": 3000,
19
+ "max_steps": 12790,
20
+ "num_train_epochs": 5,
21
+ "save_steps": 3000,
22
+ "total_flos": 39574520725504.0,
23
  "trial_name": null,
24
  "trial_params": null
25
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8639ef87c97e0b1db1451ec2c0e630582811a1a01d4762880d5387664e980641
3
  size 6840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf6b5aa86c1d81710c05be6ff9474216751b563adb5d2a3249d44c9bf2f85ad
3
  size 6840