Model save
Browse files- README.md +26 -38
- added_tokens.json +427 -428
- model.safetensors +1 -1
- tokenizer.json +0 -0
- tokenizer_config.json +0 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -2,23 +2,11 @@
|
|
2 |
library_name: transformers
|
3 |
tags:
|
4 |
- generated_from_trainer
|
5 |
-
datasets:
|
6 |
-
- kanishka/babylm2-rewritten-clean-spacy
|
7 |
metrics:
|
8 |
- accuracy
|
9 |
model-index:
|
10 |
- name: opt-babylm2-rewritten-clean-spacy-earlystop-bpe_seed-42_1e-3
|
11 |
-
results:
|
12 |
-
- task:
|
13 |
-
name: Causal Language Modeling
|
14 |
-
type: text-generation
|
15 |
-
dataset:
|
16 |
-
name: kanishka/babylm2-rewritten-clean-spacy
|
17 |
-
type: kanishka/babylm2-rewritten-clean-spacy
|
18 |
-
metrics:
|
19 |
-
- name: Accuracy
|
20 |
-
type: accuracy
|
21 |
-
value: 0.47877642614021604
|
22 |
---
|
23 |
|
24 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
@@ -26,10 +14,10 @@ should probably proofread and complete it, then remove this comment. -->
|
|
26 |
|
27 |
# opt-babylm2-rewritten-clean-spacy-earlystop-bpe_seed-42_1e-3
|
28 |
|
29 |
-
This model was trained from scratch on
|
30 |
It achieves the following results on the evaluation set:
|
31 |
-
- Loss: 2.
|
32 |
-
- Accuracy: 0.
|
33 |
|
34 |
## Model description
|
35 |
|
@@ -62,28 +50,28 @@ The following hyperparameters were used during training:
|
|
62 |
|
63 |
### Training results
|
64 |
|
65 |
-
| Training Loss | Epoch
|
66 |
-
|
67 |
-
| 4.
|
68 |
-
| 3.
|
69 |
-
| 3.
|
70 |
-
| 2.
|
71 |
-
| 2.
|
72 |
-
| 2.
|
73 |
-
| 2.
|
74 |
-
| 2.
|
75 |
-
| 2.
|
76 |
-
| 2.
|
77 |
-
| 2.
|
78 |
-
| 2.
|
79 |
-
| 2.
|
80 |
-
| 2.
|
81 |
-
| 2.
|
82 |
-
| 2.
|
83 |
-
| 2.
|
84 |
-
| 2.
|
85 |
-
| 2.
|
86 |
-
| 2.
|
87 |
|
88 |
|
89 |
### Framework versions
|
|
|
2 |
library_name: transformers
|
3 |
tags:
|
4 |
- generated_from_trainer
|
|
|
|
|
5 |
metrics:
|
6 |
- accuracy
|
7 |
model-index:
|
8 |
- name: opt-babylm2-rewritten-clean-spacy-earlystop-bpe_seed-42_1e-3
|
9 |
+
results: []
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
---
|
11 |
|
12 |
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
|
|
14 |
|
15 |
# opt-babylm2-rewritten-clean-spacy-earlystop-bpe_seed-42_1e-3
|
16 |
|
17 |
+
This model was trained from scratch on an unknown dataset.
|
18 |
It achieves the following results on the evaluation set:
|
19 |
+
- Loss: 2.6840
|
20 |
+
- Accuracy: 0.4787
|
21 |
|
22 |
## Model description
|
23 |
|
|
|
50 |
|
51 |
### Training results
|
52 |
|
53 |
+
| Training Loss | Epoch | Step | Validation Loss | Accuracy |
|
54 |
+
|:-------------:|:-------:|:-----:|:---------------:|:--------:|
|
55 |
+
| 4.1044 | 1.0 | 2256 | 3.8204 | 0.3604 |
|
56 |
+
| 3.4457 | 2.0 | 4512 | 3.3046 | 0.4093 |
|
57 |
+
| 3.13 | 3.0 | 6768 | 3.0945 | 0.4299 |
|
58 |
+
| 2.9219 | 4.0 | 9024 | 2.9890 | 0.4404 |
|
59 |
+
| 2.8444 | 5.0 | 11280 | 2.9282 | 0.4466 |
|
60 |
+
| 2.7883 | 6.0 | 13536 | 2.8910 | 0.4508 |
|
61 |
+
| 2.7434 | 7.0 | 15792 | 2.8579 | 0.4545 |
|
62 |
+
| 2.7158 | 8.0 | 18048 | 2.8428 | 0.4560 |
|
63 |
+
| 2.6905 | 9.0 | 20304 | 2.8298 | 0.4573 |
|
64 |
+
| 2.6697 | 10.0 | 22560 | 2.8169 | 0.4592 |
|
65 |
+
| 2.6509 | 11.0 | 24816 | 2.8080 | 0.4601 |
|
66 |
+
| 2.6494 | 12.0 | 27072 | 2.8020 | 0.4607 |
|
67 |
+
| 2.6384 | 13.0 | 29328 | 2.7958 | 0.4616 |
|
68 |
+
| 2.6297 | 14.0 | 31584 | 2.7939 | 0.4620 |
|
69 |
+
| 2.612 | 15.0 | 33840 | 2.7649 | 0.4653 |
|
70 |
+
| 2.5667 | 16.0 | 36096 | 2.7425 | 0.4686 |
|
71 |
+
| 2.5177 | 17.0 | 38352 | 2.7206 | 0.4714 |
|
72 |
+
| 2.4607 | 18.0 | 40608 | 2.6999 | 0.4746 |
|
73 |
+
| 2.397 | 19.0 | 42864 | 2.6865 | 0.4773 |
|
74 |
+
| 2.3241 | 19.9915 | 45100 | 2.6840 | 0.4787 |
|
75 |
|
76 |
|
77 |
### Framework versions
|
added_tokens.json
CHANGED
@@ -1,430 +1,429 @@
|
|
1 |
{
|
2 |
-
"
|
3 |
-
"
|
4 |
-
"
|
5 |
-
"
|
6 |
-
"
|
7 |
-
"
|
8 |
-
"
|
9 |
-
"
|
10 |
-
"
|
11 |
-
"
|
12 |
-
"
|
13 |
-
"
|
14 |
-
"
|
15 |
-
"
|
16 |
-
"
|
17 |
-
"
|
18 |
-
"
|
19 |
-
"
|
20 |
-
"
|
21 |
-
"
|
22 |
-
"
|
23 |
-
"
|
24 |
-
"
|
25 |
-
"
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
"
|
30 |
-
"
|
31 |
-
"
|
32 |
-
"
|
33 |
-
"
|
34 |
-
"
|
35 |
-
"
|
36 |
-
"
|
37 |
-
"
|
38 |
-
"
|
39 |
-
"
|
40 |
-
"
|
41 |
-
"
|
42 |
-
"
|
43 |
-
"
|
44 |
-
"
|
45 |
-
"
|
46 |
-
"
|
47 |
-
"
|
48 |
-
"
|
49 |
-
"
|
50 |
-
"
|
51 |
-
"
|
52 |
-
"
|
53 |
-
"
|
54 |
-
"
|
55 |
-
"
|
56 |
-
"
|
57 |
-
"
|
58 |
-
"
|
59 |
-
"
|
60 |
-
"
|
61 |
-
"
|
62 |
-
"
|
63 |
-
"
|
64 |
-
"
|
65 |
-
"
|
66 |
-
"
|
67 |
-
"
|
68 |
-
"
|
69 |
-
"
|
70 |
-
"
|
71 |
-
"
|
72 |
-
"
|
73 |
-
"
|
74 |
-
"
|
75 |
-
"
|
76 |
-
"
|
77 |
-
"
|
78 |
-
"
|
79 |
-
"
|
80 |
-
"
|
81 |
-
"
|
82 |
-
"
|
83 |
-
"
|
84 |
-
"
|
85 |
-
"
|
86 |
-
"
|
87 |
-
"
|
88 |
-
"
|
89 |
-
"
|
90 |
-
"
|
91 |
-
"
|
92 |
-
"
|
93 |
-
"
|
94 |
-
"
|
95 |
-
"
|
96 |
-
"
|
97 |
-
"
|
98 |
-
"
|
99 |
-
"
|
100 |
-
"
|
101 |
-
"
|
102 |
-
"
|
103 |
-
"
|
104 |
-
"
|
105 |
-
"
|
106 |
-
"
|
107 |
-
"
|
108 |
-
"
|
109 |
-
"
|
110 |
-
"
|
111 |
-
"
|
112 |
-
"
|
113 |
-
"
|
114 |
-
"
|
115 |
-
"
|
116 |
-
"
|
117 |
-
"
|
118 |
-
"
|
119 |
-
"
|
120 |
-
"
|
121 |
-
"
|
122 |
-
"
|
123 |
-
"
|
124 |
-
"
|
125 |
-
"
|
126 |
-
"
|
127 |
-
"
|
128 |
-
"
|
129 |
-
"
|
130 |
-
"
|
131 |
-
"
|
132 |
-
"
|
133 |
-
"
|
134 |
-
"
|
135 |
-
"
|
136 |
-
"
|
137 |
-
"
|
138 |
-
"
|
139 |
-
"
|
140 |
-
"
|
141 |
-
"
|
142 |
-
"
|
143 |
-
"
|
144 |
-
"
|
145 |
-
"
|
146 |
-
"
|
147 |
-
"
|
148 |
-
"
|
149 |
-
"
|
150 |
-
"
|
151 |
-
"
|
152 |
-
"
|
153 |
-
"
|
154 |
-
"
|
155 |
-
"
|
156 |
-
"
|
157 |
-
"
|
158 |
-
"
|
159 |
-
"
|
160 |
-
"
|
161 |
-
"
|
162 |
-
"
|
163 |
-
"
|
164 |
-
"
|
165 |
-
"
|
166 |
-
"
|
167 |
-
"
|
168 |
-
"
|
169 |
-
"
|
170 |
-
"
|
171 |
-
"
|
172 |
-
"
|
173 |
-
"
|
174 |
-
"
|
175 |
-
"
|
176 |
-
"
|
177 |
-
"
|
178 |
-
"
|
179 |
-
"
|
180 |
-
"
|
181 |
-
"
|
182 |
-
"
|
183 |
-
"
|
184 |
-
"
|
185 |
-
"
|
186 |
-
"
|
187 |
-
"
|
188 |
-
"
|
189 |
-
"
|
190 |
-
"
|
191 |
-
"
|
192 |
-
"
|
193 |
-
"
|
194 |
-
"
|
195 |
-
"
|
196 |
-
"
|
197 |
-
"
|
198 |
-
"
|
199 |
-
"
|
200 |
-
"
|
201 |
-
"
|
202 |
-
"
|
203 |
-
"
|
204 |
-
"
|
205 |
-
"
|
206 |
-
"
|
207 |
-
"
|
208 |
-
"
|
209 |
-
"
|
210 |
-
"
|
211 |
-
"
|
212 |
-
"
|
213 |
-
"
|
214 |
-
"
|
215 |
-
"
|
216 |
-
"
|
217 |
-
"
|
218 |
-
"
|
219 |
-
"
|
220 |
-
"
|
221 |
-
"
|
222 |
-
"
|
223 |
-
"
|
224 |
-
"
|
225 |
-
"
|
226 |
-
"
|
227 |
-
"
|
228 |
-
"
|
229 |
-
"
|
230 |
-
"
|
231 |
-
"
|
232 |
-
"
|
233 |
-
"
|
234 |
-
"
|
235 |
-
"
|
236 |
-
"
|
237 |
-
"
|
238 |
-
"
|
239 |
-
"
|
240 |
-
"
|
241 |
-
"
|
242 |
-
"
|
243 |
-
"
|
244 |
-
"
|
245 |
-
"
|
246 |
-
"
|
247 |
-
"
|
248 |
-
"
|
249 |
-
"
|
250 |
-
"
|
251 |
-
"
|
252 |
-
"
|
253 |
-
"
|
254 |
-
"
|
255 |
-
"
|
256 |
-
"
|
257 |
-
"
|
258 |
-
"
|
259 |
-
"
|
260 |
-
"
|
261 |
-
"
|
262 |
-
"
|
263 |
-
"
|
264 |
-
"
|
265 |
-
"
|
266 |
-
"
|
267 |
-
"
|
268 |
-
"
|
269 |
-
"
|
270 |
-
"
|
271 |
-
"
|
272 |
-
"
|
273 |
-
"
|
274 |
-
"
|
275 |
-
"
|
276 |
-
"
|
277 |
-
"
|
278 |
-
"
|
279 |
-
"
|
280 |
-
"
|
281 |
-
"
|
282 |
-
"
|
283 |
-
"
|
284 |
-
"
|
285 |
-
"
|
286 |
-
"
|
287 |
-
"
|
288 |
-
"
|
289 |
-
"
|
290 |
-
"
|
291 |
-
"
|
292 |
-
"
|
293 |
-
"
|
294 |
-
"
|
295 |
-
"
|
296 |
-
"
|
297 |
-
"
|
298 |
-
"
|
299 |
-
"
|
300 |
-
"
|
301 |
-
"
|
302 |
-
"
|
303 |
-
"
|
304 |
-
"
|
305 |
-
"
|
306 |
-
"
|
307 |
-
"
|
308 |
-
"
|
309 |
-
"
|
310 |
-
"
|
311 |
-
"
|
312 |
-
"
|
313 |
-
"
|
314 |
-
"
|
315 |
-
"
|
316 |
-
"
|
317 |
-
"
|
318 |
-
"
|
319 |
-
"
|
320 |
-
"
|
321 |
-
"
|
322 |
-
"
|
323 |
-
"
|
324 |
-
"
|
325 |
-
"
|
326 |
-
"
|
327 |
-
"
|
328 |
-
"
|
329 |
-
"
|
330 |
-
"
|
331 |
-
"
|
332 |
-
"
|
333 |
-
"
|
334 |
-
"
|
335 |
-
"
|
336 |
-
"
|
337 |
-
"
|
338 |
-
"
|
339 |
-
"
|
340 |
-
"
|
341 |
-
"
|
342 |
-
"
|
343 |
-
"
|
344 |
-
"
|
345 |
-
"
|
346 |
-
"
|
347 |
-
"
|
348 |
-
"
|
349 |
-
"
|
350 |
-
"
|
351 |
-
"
|
352 |
-
"
|
353 |
-
"
|
354 |
-
"
|
355 |
-
"
|
356 |
-
"
|
357 |
-
"
|
358 |
-
"
|
359 |
-
"
|
360 |
-
"
|
361 |
-
"
|
362 |
-
"
|
363 |
-
"
|
364 |
-
"
|
365 |
-
"
|
366 |
-
"
|
367 |
-
"
|
368 |
-
"
|
369 |
-
"
|
370 |
-
"
|
371 |
-
"
|
372 |
-
"
|
373 |
-
"
|
374 |
-
"
|
375 |
-
"
|
376 |
-
"
|
377 |
-
"
|
378 |
-
"
|
379 |
-
"
|
380 |
-
"
|
381 |
-
"
|
382 |
-
"
|
383 |
-
"
|
384 |
-
"
|
385 |
-
"
|
386 |
-
"
|
387 |
-
"
|
388 |
-
"
|
389 |
-
"
|
390 |
-
"
|
391 |
-
"
|
392 |
-
"
|
393 |
-
"
|
394 |
-
"
|
395 |
-
"
|
396 |
-
"
|
397 |
-
"
|
398 |
-
"
|
399 |
-
"
|
400 |
-
"
|
401 |
-
"
|
402 |
-
"
|
403 |
-
"
|
404 |
-
"
|
405 |
-
"
|
406 |
-
"
|
407 |
-
"
|
408 |
-
"
|
409 |
-
"
|
410 |
-
"
|
411 |
-
"
|
412 |
-
"
|
413 |
-
"
|
414 |
-
"
|
415 |
-
"
|
416 |
-
"
|
417 |
-
"
|
418 |
-
"
|
419 |
-
"
|
420 |
-
"
|
421 |
-
"
|
422 |
-
"
|
423 |
-
"
|
424 |
-
"
|
425 |
-
"
|
426 |
-
"
|
427 |
-
"
|
428 |
-
"
|
429 |
-
"Ġ999": 16570
|
430 |
}
|
|
|
1 |
{
|
2 |
+
"01": 16510,
|
3 |
+
"02": 16511,
|
4 |
+
"03": 16512,
|
5 |
+
"04": 16573,
|
6 |
+
"05": 16537,
|
7 |
+
"06": 16611,
|
8 |
+
"07": 16464,
|
9 |
+
"08": 16475,
|
10 |
+
"09": 16598,
|
11 |
+
"1000000000": 16466,
|
12 |
+
"1001": 16551,
|
13 |
+
"102": 16472,
|
14 |
+
"103": 16393,
|
15 |
+
"104": 16545,
|
16 |
+
"106": 16546,
|
17 |
+
"1066": 16702,
|
18 |
+
"107": 16444,
|
19 |
+
"108": 16445,
|
20 |
+
"109": 16538,
|
21 |
+
"1100": 16424,
|
22 |
+
"11000": 16539,
|
23 |
+
"111": 16389,
|
24 |
+
"112": 16446,
|
25 |
+
"113": 16447,
|
26 |
+
"114": 16450,
|
27 |
+
"115": 16451,
|
28 |
+
"116": 16499,
|
29 |
+
"117": 16452,
|
30 |
+
"118": 16443,
|
31 |
+
"119": 16453,
|
32 |
+
"12000": 16529,
|
33 |
+
"120000": 16570,
|
34 |
+
"121": 16414,
|
35 |
+
"122": 16456,
|
36 |
+
"123": 16505,
|
37 |
+
"124": 16549,
|
38 |
+
"1250": 16541,
|
39 |
+
"126": 16488,
|
40 |
+
"127": 16398,
|
41 |
+
"128": 16550,
|
42 |
+
"129": 16458,
|
43 |
+
"1300": 16425,
|
44 |
+
"13000": 16601,
|
45 |
+
"131": 16410,
|
46 |
+
"132": 16459,
|
47 |
+
"133": 16477,
|
48 |
+
"134": 16460,
|
49 |
+
"135": 16396,
|
50 |
+
"136": 16480,
|
51 |
+
"137": 16527,
|
52 |
+
"138": 16487,
|
53 |
+
"139": 16532,
|
54 |
+
"1400": 16426,
|
55 |
+
"14000": 16553,
|
56 |
+
"141": 16416,
|
57 |
+
"142": 16624,
|
58 |
+
"143": 16401,
|
59 |
+
"144": 16521,
|
60 |
+
"145": 16386,
|
61 |
+
"146": 16502,
|
62 |
+
"147": 16578,
|
63 |
+
"148": 16506,
|
64 |
+
"149": 16556,
|
65 |
+
"15000": 16399,
|
66 |
+
"150000": 16481,
|
67 |
+
"151": 16417,
|
68 |
+
"152": 16582,
|
69 |
+
"153": 16390,
|
70 |
+
"154": 16618,
|
71 |
+
"155": 16643,
|
72 |
+
"156": 16391,
|
73 |
+
"157": 16682,
|
74 |
+
"158": 16496,
|
75 |
+
"159": 16580,
|
76 |
+
"1600": 16427,
|
77 |
+
"16000": 16482,
|
78 |
+
"1603": 16572,
|
79 |
+
"161": 16437,
|
80 |
+
"162": 16574,
|
81 |
+
"1620": 16729,
|
82 |
+
"163": 16392,
|
83 |
+
"164": 16629,
|
84 |
+
"165": 16554,
|
85 |
+
"166": 16677,
|
86 |
+
"1660": 16565,
|
87 |
+
"1666": 16633,
|
88 |
+
"167": 16692,
|
89 |
+
"168": 16461,
|
90 |
+
"169": 16479,
|
91 |
+
"1700": 16428,
|
92 |
+
"17000": 16571,
|
93 |
+
"1707": 16785,
|
94 |
+
"171": 16504,
|
95 |
+
"172": 16584,
|
96 |
+
"173": 16557,
|
97 |
+
"174": 16542,
|
98 |
+
"1740": 16620,
|
99 |
+
"1748": 16793,
|
100 |
+
"1750": 16685,
|
101 |
+
"1755": 16737,
|
102 |
+
"1756": 16791,
|
103 |
+
"1758": 16717,
|
104 |
+
"1760": 16731,
|
105 |
+
"1762": 16701,
|
106 |
+
"1763": 16755,
|
107 |
+
"1764": 16773,
|
108 |
+
"1765": 16772,
|
109 |
+
"1768": 16720,
|
110 |
+
"1770": 16805,
|
111 |
+
"1772": 16803,
|
112 |
+
"1773": 16792,
|
113 |
+
"1774": 16751,
|
114 |
+
"1775": 16723,
|
115 |
+
"1776": 16728,
|
116 |
+
"1777": 16790,
|
117 |
+
"1778": 16694,
|
118 |
+
"1779": 16724,
|
119 |
+
"1780": 16700,
|
120 |
+
"1781": 16752,
|
121 |
+
"1783": 16769,
|
122 |
+
"1784": 16767,
|
123 |
+
"1785": 16768,
|
124 |
+
"1786": 16613,
|
125 |
+
"1787": 16638,
|
126 |
+
"1788": 16650,
|
127 |
+
"1789": 16465,
|
128 |
+
"1790": 16591,
|
129 |
+
"1791": 16794,
|
130 |
+
"1792": 16738,
|
131 |
+
"1793": 16714,
|
132 |
+
"1794": 16739,
|
133 |
+
"1795": 16756,
|
134 |
+
"1796": 16797,
|
135 |
+
"1797": 16796,
|
136 |
+
"1798": 16716,
|
137 |
+
"1799": 16634,
|
138 |
+
"18000": 16599,
|
139 |
+
"1801": 16801,
|
140 |
+
"1802": 16759,
|
141 |
+
"1803": 16802,
|
142 |
+
"1804": 16735,
|
143 |
+
"1805": 16798,
|
144 |
+
"1806": 16689,
|
145 |
+
"1807": 16757,
|
146 |
+
"1808": 16746,
|
147 |
+
"1809": 16761,
|
148 |
+
"181": 16420,
|
149 |
+
"1810": 16804,
|
150 |
+
"1811": 16706,
|
151 |
+
"1812": 16625,
|
152 |
+
"1813": 16712,
|
153 |
+
"1814": 16609,
|
154 |
+
"1815": 16703,
|
155 |
+
"1816": 16734,
|
156 |
+
"1817": 16758,
|
157 |
+
"1818": 16704,
|
158 |
+
"1819": 16636,
|
159 |
+
"182": 16412,
|
160 |
+
"1820": 16708,
|
161 |
+
"1821": 16707,
|
162 |
+
"1822": 16781,
|
163 |
+
"1823": 16774,
|
164 |
+
"1824": 16637,
|
165 |
+
"1825": 16709,
|
166 |
+
"1826": 16710,
|
167 |
+
"1827": 16711,
|
168 |
+
"1828": 16799,
|
169 |
+
"1829": 16760,
|
170 |
+
"1830": 16668,
|
171 |
+
"1831": 16764,
|
172 |
+
"1832": 16779,
|
173 |
+
"1833": 16590,
|
174 |
+
"1834": 16795,
|
175 |
+
"1835": 16666,
|
176 |
+
"1836": 16754,
|
177 |
+
"1837": 16736,
|
178 |
+
"1838": 16800,
|
179 |
+
"1839": 16669,
|
180 |
+
"1840": 16576,
|
181 |
+
"1841": 16775,
|
182 |
+
"1842": 16780,
|
183 |
+
"1843": 16763,
|
184 |
+
"1844": 16489,
|
185 |
+
"1845": 16753,
|
186 |
+
"1846": 16670,
|
187 |
+
"1847": 16671,
|
188 |
+
"1848": 16655,
|
189 |
+
"1849": 16732,
|
190 |
+
"1850": 16567,
|
191 |
+
"1851": 16765,
|
192 |
+
"1852": 16713,
|
193 |
+
"1853": 16727,
|
194 |
+
"1854": 16786,
|
195 |
+
"1855": 16733,
|
196 |
+
"1856": 16610,
|
197 |
+
"1857": 16776,
|
198 |
+
"1858": 16672,
|
199 |
+
"1859": 16687,
|
200 |
+
"1860": 16566,
|
201 |
+
"1861": 16664,
|
202 |
+
"1862": 16652,
|
203 |
+
"1863": 16762,
|
204 |
+
"1864": 16676,
|
205 |
+
"1865": 16686,
|
206 |
+
"1866": 16663,
|
207 |
+
"1867": 16673,
|
208 |
+
"1868": 16698,
|
209 |
+
"1869": 16631,
|
210 |
+
"1871": 16699,
|
211 |
+
"1872": 16766,
|
212 |
+
"1873": 16747,
|
213 |
+
"1874": 16748,
|
214 |
+
"1875": 16782,
|
215 |
+
"1876": 16749,
|
216 |
+
"1877": 16722,
|
217 |
+
"1878": 16715,
|
218 |
+
"1879": 16648,
|
219 |
+
"1880": 16587,
|
220 |
+
"1881": 16695,
|
221 |
+
"1882": 16777,
|
222 |
+
"1883": 16778,
|
223 |
+
"1884": 16750,
|
224 |
+
"1885": 16783,
|
225 |
+
"1886": 16730,
|
226 |
+
"1887": 16770,
|
227 |
+
"1888": 16667,
|
228 |
+
"1889": 16647,
|
229 |
+
"1891": 16771,
|
230 |
+
"1892": 16646,
|
231 |
+
"1893": 16674,
|
232 |
+
"1894": 16596,
|
233 |
+
"1895": 16725,
|
234 |
+
"1896": 16696,
|
235 |
+
"1897": 16654,
|
236 |
+
"1898": 16653,
|
237 |
+
"1899": 16690,
|
238 |
+
"1901": 16651,
|
239 |
+
"1902": 16697,
|
240 |
+
"1903": 16691,
|
241 |
+
"1904": 16534,
|
242 |
+
"1906": 16588,
|
243 |
+
"1907": 16635,
|
244 |
+
"192220": 16807,
|
245 |
+
"2000000": 16490,
|
246 |
+
"201920": 16809,
|
247 |
+
"202021": 16810,
|
248 |
+
"2025": 16644,
|
249 |
+
"203": 16665,
|
250 |
+
"204": 16597,
|
251 |
+
"205": 16513,
|
252 |
+
"206": 16400,
|
253 |
+
"207": 16726,
|
254 |
+
"208": 16581,
|
255 |
+
"209": 16455,
|
256 |
+
"210": 16484,
|
257 |
+
"2100": 16552,
|
258 |
+
"211": 16431,
|
259 |
+
"212": 16419,
|
260 |
+
"213": 16415,
|
261 |
+
"214": 16515,
|
262 |
+
"215": 16621,
|
263 |
+
"216": 16743,
|
264 |
+
"217": 16497,
|
265 |
+
"218": 16418,
|
266 |
+
"219": 16476,
|
267 |
+
"220": 16403,
|
268 |
+
"2200": 16439,
|
269 |
+
"22000": 16501,
|
270 |
+
"221": 16661,
|
271 |
+
"222": 16434,
|
272 |
+
"223": 16436,
|
273 |
+
"224": 16533,
|
274 |
+
"225": 16462,
|
275 |
+
"226": 16530,
|
276 |
+
"227": 16525,
|
277 |
+
"228": 16503,
|
278 |
+
"230": 16433,
|
279 |
+
"2300": 16603,
|
280 |
+
"231": 16602,
|
281 |
+
"232": 16522,
|
282 |
+
"233": 16526,
|
283 |
+
"234": 16509,
|
284 |
+
"235": 16564,
|
285 |
+
"236": 16742,
|
286 |
+
"237": 16469,
|
287 |
+
"238": 16583,
|
288 |
+
"239": 16744,
|
289 |
+
"240": 16413,
|
290 |
+
"2400": 16385,
|
291 |
+
"241": 16586,
|
292 |
+
"243": 16485,
|
293 |
+
"244": 16498,
|
294 |
+
"245": 16561,
|
295 |
+
"246": 16558,
|
296 |
+
"247": 16559,
|
297 |
+
"248": 16562,
|
298 |
+
"249": 16560,
|
299 |
+
"2500": 16429,
|
300 |
+
"25000": 16397,
|
301 |
+
"250000": 16471,
|
302 |
+
"251": 16656,
|
303 |
+
"253": 16662,
|
304 |
+
"254": 16616,
|
305 |
+
"255": 16594,
|
306 |
+
"256": 16718,
|
307 |
+
"257": 16523,
|
308 |
+
"258": 16626,
|
309 |
+
"259": 16387,
|
310 |
+
"260": 16411,
|
311 |
+
"2600": 16430,
|
312 |
+
"261": 16627,
|
313 |
+
"262": 16421,
|
314 |
+
"263": 16457,
|
315 |
+
"264": 16516,
|
316 |
+
"265": 16536,
|
317 |
+
"266": 16628,
|
318 |
+
"267": 16719,
|
319 |
+
"268": 16507,
|
320 |
+
"269": 16605,
|
321 |
+
"270": 16520,
|
322 |
+
"271": 16787,
|
323 |
+
"272": 16658,
|
324 |
+
"273": 16789,
|
325 |
+
"275": 16508,
|
326 |
+
"278": 16473,
|
327 |
+
"280": 16404,
|
328 |
+
"281": 16608,
|
329 |
+
"282": 16623,
|
330 |
+
"283": 16432,
|
331 |
+
"285": 16617,
|
332 |
+
"286": 16555,
|
333 |
+
"287": 16660,
|
334 |
+
"290": 16659,
|
335 |
+
"291": 16784,
|
336 |
+
"293": 16612,
|
337 |
+
"294": 16639,
|
338 |
+
"295": 16640,
|
339 |
+
"296": 16478,
|
340 |
+
"299": 16604,
|
341 |
+
"300000": 16474,
|
342 |
+
"3000000": 16495,
|
343 |
+
"301": 16600,
|
344 |
+
"302": 16641,
|
345 |
+
"303": 16543,
|
346 |
+
"304": 16592,
|
347 |
+
"305": 16486,
|
348 |
+
"306": 16491,
|
349 |
+
"307": 16622,
|
350 |
+
"308": 16675,
|
351 |
+
"309": 16684,
|
352 |
+
"310": 16688,
|
353 |
+
"311": 16589,
|
354 |
+
"312": 16607,
|
355 |
+
"313": 16519,
|
356 |
+
"314": 16678,
|
357 |
+
"315": 16745,
|
358 |
+
"316": 16680,
|
359 |
+
"318": 16679,
|
360 |
+
"319": 16681,
|
361 |
+
"320": 16405,
|
362 |
+
"323": 16454,
|
363 |
+
"324": 16741,
|
364 |
+
"325": 16514,
|
365 |
+
"326": 16463,
|
366 |
+
"327": 16645,
|
367 |
+
"330": 16788,
|
368 |
+
"333": 16693,
|
369 |
+
"340": 16615,
|
370 |
+
"343": 16705,
|
371 |
+
"3500": 16440,
|
372 |
+
"35000": 16524,
|
373 |
+
"352": 16683,
|
374 |
+
"355": 16528,
|
375 |
+
"357": 16388,
|
376 |
+
"360": 16435,
|
377 |
+
"365": 16535,
|
378 |
+
"370": 16494,
|
379 |
+
"375": 16563,
|
380 |
+
"380": 16406,
|
381 |
+
"386": 16540,
|
382 |
+
"395": 16575,
|
383 |
+
"40000": 16395,
|
384 |
+
"400000": 16483,
|
385 |
+
"401": 16642,
|
386 |
+
"405": 16585,
|
387 |
+
"408": 16657,
|
388 |
+
"410": 16579,
|
389 |
+
"420": 16407,
|
390 |
+
"421": 16531,
|
391 |
+
"423": 16493,
|
392 |
+
"430": 16568,
|
393 |
+
"440": 16614,
|
394 |
+
"4400": 16577,
|
395 |
+
"441": 16632,
|
396 |
+
"450": 16402,
|
397 |
+
"4500": 16441,
|
398 |
+
"45000": 16470,
|
399 |
+
"460": 16619,
|
400 |
+
"480": 16408,
|
401 |
+
"481": 16630,
|
402 |
+
"550": 16409,
|
403 |
+
"60000": 16517,
|
404 |
+
"600000": 16500,
|
405 |
+
"650": 16422,
|
406 |
+
"6500": 16548,
|
407 |
+
"660": 16649,
|
408 |
+
"7000": 16442,
|
409 |
+
"70000": 16394,
|
410 |
+
"700000": 16467,
|
411 |
+
"720": 16448,
|
412 |
+
"727": 16808,
|
413 |
+
"737": 16806,
|
414 |
+
"747": 16492,
|
415 |
+
"750": 16438,
|
416 |
+
"7500": 16544,
|
417 |
+
"75000": 16606,
|
418 |
+
"777": 16740,
|
419 |
+
"8000": 16468,
|
420 |
+
"80000": 16593,
|
421 |
+
"800000": 16547,
|
422 |
+
"850": 16449,
|
423 |
+
"9000": 16518,
|
424 |
+
"90000": 16595,
|
425 |
+
"911": 16721,
|
426 |
+
"950": 16423,
|
427 |
+
"999": 16569,
|
428 |
+
"<|endoftext|>": 16384
|
|
|
429 |
}
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 392682336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c150e0b350f07cf568ff48fe1eb30059ec3e50454b5b418834dc0eae576757ae
|
3 |
size 392682336
|
tokenizer.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5496
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1f5d89d6ac20c7296ba53464c714e8bdab0613d048f74e0d7be23d39c017522
|
3 |
size 5496
|