ChiefTheLord committed on
Commit
6ccdddc
verified
1 Parent(s): 51a4757

Delete checkpoints

Browse files
checkpoints/checkpoint-64/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3bc3e42a9b64e2588302c65f922098dc164e9533637b0366d543059cffc4d46e
3
- size 14851088
 
 
 
 
checkpoints/checkpoint-64/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:20eb77acf0aad2036561ff4a6a2f7ea60e5460cd7315622fe018edf6af9477fa
3
- size 29695994
 
 
 
 
checkpoints/checkpoint-64/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ed2e591b77a8475236224c0177524db10370f13296177433e7087f6779de2cd
3
- size 14244
 
 
 
 
checkpoints/checkpoint-64/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:79bdcda359cedf04bc9f65fce5ca61248f4a235c6e9c8a45682aa2dfc095ac0f
3
- size 1064
 
 
 
 
checkpoints/checkpoint-64/trainer_state.json DELETED
@@ -1,161 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 25.6,
5
- "eval_steps": 8,
6
- "global_step": 64,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 3.2,
13
- "grad_norm": 2.572068691253662,
14
- "learning_rate": 6.153846153846155e-05,
15
- "loss": 1.4317,
16
- "step": 8
17
- },
18
- {
19
- "epoch": 3.2,
20
- "eval_accuracy": 0.6066666666666667,
21
- "eval_loss": 1.3396244049072266,
22
- "eval_runtime": 4.4787,
23
- "eval_samples_per_second": 33.492,
24
- "eval_steps_per_second": 0.67,
25
- "step": 8
26
- },
27
- {
28
- "epoch": 6.4,
29
- "grad_norm": 14.756144523620605,
30
- "learning_rate": 9.91486549841951e-05,
31
- "loss": 1.3743,
32
- "step": 16
33
- },
34
- {
35
- "epoch": 6.4,
36
- "eval_accuracy": 0.6,
37
- "eval_loss": 1.4254791736602783,
38
- "eval_runtime": 4.2212,
39
- "eval_samples_per_second": 35.535,
40
- "eval_steps_per_second": 0.711,
41
- "step": 16
42
- },
43
- {
44
- "epoch": 9.6,
45
- "grad_norm": 6.530676364898682,
46
- "learning_rate": 8.895402872628352e-05,
47
- "loss": 1.3977,
48
- "step": 24
49
- },
50
- {
51
- "epoch": 9.6,
52
- "eval_accuracy": 0.6466666666666666,
53
- "eval_loss": 1.3245296478271484,
54
- "eval_runtime": 4.2384,
55
- "eval_samples_per_second": 35.391,
56
- "eval_steps_per_second": 0.708,
57
- "step": 24
58
- },
59
- {
60
- "epoch": 12.8,
61
- "grad_norm": 14.631135940551758,
62
- "learning_rate": 6.948929366463396e-05,
63
- "loss": 1.3629,
64
- "step": 32
65
- },
66
- {
67
- "epoch": 12.8,
68
- "eval_accuracy": 0.64,
69
- "eval_loss": 1.290442943572998,
70
- "eval_runtime": 5.0282,
71
- "eval_samples_per_second": 29.832,
72
- "eval_steps_per_second": 0.597,
73
- "step": 32
74
- },
75
- {
76
- "epoch": 16.0,
77
- "grad_norm": 4.518190383911133,
78
- "learning_rate": 4.5386582026834906e-05,
79
- "loss": 1.3515,
80
- "step": 40
81
- },
82
- {
83
- "epoch": 16.0,
84
- "eval_accuracy": 0.6266666666666667,
85
- "eval_loss": 1.3534621000289917,
86
- "eval_runtime": 6.0978,
87
- "eval_samples_per_second": 24.599,
88
- "eval_steps_per_second": 0.492,
89
- "step": 40
90
- },
91
- {
92
- "epoch": 19.2,
93
- "grad_norm": 10.279590606689453,
94
- "learning_rate": 2.500000000000001e-05,
95
- "loss": 1.3871,
96
- "step": 48
97
- },
98
- {
99
- "epoch": 19.2,
100
- "eval_accuracy": 0.5933333333333334,
101
- "eval_loss": 1.3667320013046265,
102
- "eval_runtime": 6.4398,
103
- "eval_samples_per_second": 23.293,
104
- "eval_steps_per_second": 0.466,
105
- "step": 48
106
- },
107
- {
108
- "epoch": 22.4,
109
- "grad_norm": 5.7001872062683105,
110
- "learning_rate": 7.489143213519301e-06,
111
- "loss": 1.3224,
112
- "step": 56
113
- },
114
- {
115
- "epoch": 22.4,
116
- "eval_accuracy": 0.6066666666666667,
117
- "eval_loss": 1.3154500722885132,
118
- "eval_runtime": 4.7475,
119
- "eval_samples_per_second": 31.595,
120
- "eval_steps_per_second": 0.632,
121
- "step": 56
122
- },
123
- {
124
- "epoch": 25.6,
125
- "grad_norm": 8.32728385925293,
126
- "learning_rate": 9.483356314779479e-08,
127
- "loss": 1.328,
128
- "step": 64
129
- },
130
- {
131
- "epoch": 25.6,
132
- "eval_accuracy": 0.6333333333333333,
133
- "eval_loss": 1.2921510934829712,
134
- "eval_runtime": 4.2106,
135
- "eval_samples_per_second": 35.625,
136
- "eval_steps_per_second": 0.712,
137
- "step": 64
138
- }
139
- ],
140
- "logging_steps": 8,
141
- "max_steps": 64,
142
- "num_input_tokens_seen": 0,
143
- "num_train_epochs": 32,
144
- "save_steps": 8,
145
- "stateful_callbacks": {
146
- "TrainerControl": {
147
- "args": {
148
- "should_epoch_stop": false,
149
- "should_evaluate": false,
150
- "should_log": false,
151
- "should_save": true,
152
- "should_training_stop": true
153
- },
154
- "attributes": {}
155
- }
156
- },
157
- "total_flos": 0.0,
158
- "train_batch_size": 64,
159
- "trial_name": null,
160
- "trial_params": null
161
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoints/checkpoint-64/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:07709a6f9df64331b59c24c1eeaafbea2a2d582622d433b37f7ed72b3574b7fc
3
- size 5112