Training in progress, step 10000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/text_renderer_config.json +17 -5
- last-checkpoint/trainer_state.json +93 -93
- last-checkpoint/training_args.bin +1 -1
- pytorch_model.bin +1 -1
- text_renderer_config.json +17 -5
- training_args.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 202193937
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec52caad045b3f34632491a3e60266fca49fb4a8996857ded69858dac82d39b4
|
3 |
size 202193937
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 102501541
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4934ec353ee8c0b201d8896e01193b73d8d525ed3d2c04d990e1d6af1e4f1ff
|
3 |
size 102501541
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_4.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_5.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_6.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/rng_state_7.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:161364992086d421e640cb46d16fb2f26cefdd719c2e2fd276cf5231abbcc82c
|
3 |
size 14503
|
last-checkpoint/text_renderer_config.json
CHANGED
@@ -16,18 +16,20 @@
|
|
16 |
"Nimbus Roman",
|
17 |
"Nimbus Sans",
|
18 |
"Nimbus Sans Narrow",
|
|
|
|
|
19 |
"Noto Kufi Arabic",
|
20 |
-
"Noto Looped Lao",
|
21 |
-
"Noto Looped Lao UI",
|
22 |
"Noto Music",
|
23 |
"Noto Naskh Arabic",
|
24 |
"Noto Naskh Arabic UI",
|
25 |
"Noto Nastaliq Urdu",
|
26 |
"Noto Rashi Hebrew",
|
|
|
27 |
"Noto Sans Adlam",
|
28 |
"Noto Sans Adlam Unjoined",
|
29 |
"Noto Sans Anatolian Hieroglyphs",
|
30 |
"Noto Sans Arabic",
|
|
|
31 |
"Noto Sans Armenian",
|
32 |
"Noto Sans Avestan",
|
33 |
"Noto Sans Balinese",
|
@@ -86,12 +88,16 @@
|
|
86 |
"Noto Sans Kaithi",
|
87 |
"Noto Sans Kannada",
|
88 |
"Noto Sans Kannada UI",
|
|
|
89 |
"Noto Sans Kayah Li",
|
90 |
"Noto Sans Kharoshthi",
|
91 |
"Noto Sans Khmer",
|
92 |
"Noto Sans Khmer UI",
|
|
|
93 |
"Noto Sans Khudawadi",
|
94 |
"Noto Sans Lao",
|
|
|
|
|
95 |
"Noto Sans Lao UI",
|
96 |
"Noto Sans Lepcha",
|
97 |
"Noto Sans Limbu",
|
@@ -123,13 +129,15 @@
|
|
123 |
"Noto Sans Myanmar UI",
|
124 |
"Noto Sans NKo",
|
125 |
"Noto Sans Nabataean",
|
|
|
126 |
"Noto Sans Nandinagari",
|
127 |
"Noto Sans New Tai Lue",
|
128 |
"Noto Sans Newa",
|
129 |
"Noto Sans Nushu",
|
130 |
"Noto Sans Ogham",
|
131 |
-
"Noto Sans
|
132 |
"Noto Sans Old Hungarian",
|
|
|
133 |
"Noto Sans Old North Arabian",
|
134 |
"Noto Sans Old Permic",
|
135 |
"Noto Sans Old Persian",
|
@@ -142,7 +150,7 @@
|
|
142 |
"Noto Sans Pahawh Hmong",
|
143 |
"Noto Sans Palmyrene",
|
144 |
"Noto Sans Pau Cin Hau",
|
145 |
-
"Noto Sans
|
146 |
"Noto Sans Phoenician",
|
147 |
"Noto Sans Psalter Pahlavi",
|
148 |
"Noto Sans Rejang",
|
@@ -156,11 +164,15 @@
|
|
156 |
"Noto Sans Sinhala",
|
157 |
"Noto Sans Sinhala UI",
|
158 |
"Noto Sans Sogdian",
|
|
|
159 |
"Noto Sans Soyombo",
|
|
|
160 |
"Noto Sans Syloti Nagri",
|
161 |
"Noto Sans Symbols",
|
162 |
-
"Noto Sans
|
163 |
"Noto Sans Syriac",
|
|
|
|
|
164 |
"Noto Sans Tagalog",
|
165 |
"Noto Sans Tagbanwa",
|
166 |
"Noto Sans Tai Le",
|
|
|
16 |
"Nimbus Roman",
|
17 |
"Nimbus Sans",
|
18 |
"Nimbus Sans Narrow",
|
19 |
+
"Noto Fangsong KSS Rotated",
|
20 |
+
"Noto Fangsong KSS Vertical",
|
21 |
"Noto Kufi Arabic",
|
|
|
|
|
22 |
"Noto Music",
|
23 |
"Noto Naskh Arabic",
|
24 |
"Noto Naskh Arabic UI",
|
25 |
"Noto Nastaliq Urdu",
|
26 |
"Noto Rashi Hebrew",
|
27 |
+
"Noto Sans",
|
28 |
"Noto Sans Adlam",
|
29 |
"Noto Sans Adlam Unjoined",
|
30 |
"Noto Sans Anatolian Hieroglyphs",
|
31 |
"Noto Sans Arabic",
|
32 |
+
"Noto Sans Arabic UI",
|
33 |
"Noto Sans Armenian",
|
34 |
"Noto Sans Avestan",
|
35 |
"Noto Sans Balinese",
|
|
|
88 |
"Noto Sans Kaithi",
|
89 |
"Noto Sans Kannada",
|
90 |
"Noto Sans Kannada UI",
|
91 |
+
"Noto Sans Kawi",
|
92 |
"Noto Sans Kayah Li",
|
93 |
"Noto Sans Kharoshthi",
|
94 |
"Noto Sans Khmer",
|
95 |
"Noto Sans Khmer UI",
|
96 |
+
"Noto Sans Khojki",
|
97 |
"Noto Sans Khudawadi",
|
98 |
"Noto Sans Lao",
|
99 |
+
"Noto Sans Lao Looped",
|
100 |
+
"Noto Sans Lao Looped UI",
|
101 |
"Noto Sans Lao UI",
|
102 |
"Noto Sans Lepcha",
|
103 |
"Noto Sans Limbu",
|
|
|
129 |
"Noto Sans Myanmar UI",
|
130 |
"Noto Sans NKo",
|
131 |
"Noto Sans Nabataean",
|
132 |
+
"Noto Sans Nag Mundari",
|
133 |
"Noto Sans Nandinagari",
|
134 |
"Noto Sans New Tai Lue",
|
135 |
"Noto Sans Newa",
|
136 |
"Noto Sans Nushu",
|
137 |
"Noto Sans Ogham",
|
138 |
+
"Noto Sans Ol Chiki",
|
139 |
"Noto Sans Old Hungarian",
|
140 |
+
"Noto Sans Old Italic",
|
141 |
"Noto Sans Old North Arabian",
|
142 |
"Noto Sans Old Permic",
|
143 |
"Noto Sans Old Persian",
|
|
|
150 |
"Noto Sans Pahawh Hmong",
|
151 |
"Noto Sans Palmyrene",
|
152 |
"Noto Sans Pau Cin Hau",
|
153 |
+
"Noto Sans Phags-Pa",
|
154 |
"Noto Sans Phoenician",
|
155 |
"Noto Sans Psalter Pahlavi",
|
156 |
"Noto Sans Rejang",
|
|
|
164 |
"Noto Sans Sinhala",
|
165 |
"Noto Sans Sinhala UI",
|
166 |
"Noto Sans Sogdian",
|
167 |
+
"Noto Sans Sora Sompeng",
|
168 |
"Noto Sans Soyombo",
|
169 |
+
"Noto Sans Sundanese",
|
170 |
"Noto Sans Syloti Nagri",
|
171 |
"Noto Sans Symbols",
|
172 |
+
"Noto Sans Symbols 2",
|
173 |
"Noto Sans Syriac",
|
174 |
+
"Noto Sans Syriac Eastern",
|
175 |
+
"Noto Sans Syriac Western",
|
176 |
"Noto Sans Tagalog",
|
177 |
"Noto Sans Tagbanwa",
|
178 |
"Noto Sans Tai Le",
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,216 +1,216 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
"global_step": 10000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
-
"epoch": 0.
|
12 |
"learning_rate": 5.999999999999999e-06,
|
13 |
-
"loss": 0.
|
14 |
"step": 500
|
15 |
},
|
16 |
{
|
17 |
-
"epoch": 0.
|
18 |
"learning_rate": 1.1999999999999999e-05,
|
19 |
-
"loss": 0.
|
20 |
"step": 1000
|
21 |
},
|
22 |
{
|
23 |
-
"epoch": 0.
|
24 |
-
"eval_loss": 0.
|
25 |
-
"eval_runtime": 1.
|
26 |
-
"eval_samples_per_second":
|
27 |
-
"eval_steps_per_second":
|
28 |
"step": 1000
|
29 |
},
|
30 |
{
|
31 |
-
"epoch": 0.
|
32 |
"learning_rate": 1.7999999999999997e-05,
|
33 |
-
"loss": 0.
|
34 |
"step": 1500
|
35 |
},
|
36 |
{
|
37 |
-
"epoch": 0.
|
38 |
"learning_rate": 2.3999999999999997e-05,
|
39 |
-
"loss": 0.
|
40 |
"step": 2000
|
41 |
},
|
42 |
{
|
43 |
-
"epoch": 0.
|
44 |
-
"eval_loss": 0.
|
45 |
-
"eval_runtime": 1.
|
46 |
-
"eval_samples_per_second":
|
47 |
-
"eval_steps_per_second":
|
48 |
"step": 2000
|
49 |
},
|
50 |
{
|
51 |
-
"epoch": 0.
|
52 |
"learning_rate": 2.9999999999999997e-05,
|
53 |
-
"loss": 0.
|
54 |
"step": 2500
|
55 |
},
|
56 |
{
|
57 |
-
"epoch": 0.
|
58 |
"learning_rate": 3.5999999999999994e-05,
|
59 |
-
"loss": 0.
|
60 |
"step": 3000
|
61 |
},
|
62 |
{
|
63 |
-
"epoch": 0.
|
64 |
-
"eval_loss": 0.
|
65 |
-
"eval_runtime": 1.
|
66 |
-
"eval_samples_per_second":
|
67 |
-
"eval_steps_per_second":
|
68 |
"step": 3000
|
69 |
},
|
70 |
{
|
71 |
-
"epoch":
|
72 |
"learning_rate": 4.2e-05,
|
73 |
-
"loss": 0.
|
74 |
"step": 3500
|
75 |
},
|
76 |
{
|
77 |
-
"epoch":
|
78 |
"learning_rate": 4.7999999999999994e-05,
|
79 |
-
"loss": 0.
|
80 |
"step": 4000
|
81 |
},
|
82 |
{
|
83 |
-
"epoch":
|
84 |
-
"eval_loss": 0.
|
85 |
-
"eval_runtime": 1.
|
86 |
-
"eval_samples_per_second":
|
87 |
-
"eval_steps_per_second":
|
88 |
"step": 4000
|
89 |
},
|
90 |
{
|
91 |
-
"epoch": 1
|
92 |
"learning_rate": 5.399999999999999e-05,
|
93 |
-
"loss": 0.
|
94 |
"step": 4500
|
95 |
},
|
96 |
{
|
97 |
-
"epoch":
|
98 |
"learning_rate": 5.9999999999999995e-05,
|
99 |
-
"loss": 0.
|
100 |
"step": 5000
|
101 |
},
|
102 |
{
|
103 |
-
"epoch":
|
104 |
-
"eval_loss": 0.
|
105 |
-
"eval_runtime": 1.
|
106 |
-
"eval_samples_per_second":
|
107 |
-
"eval_steps_per_second":
|
108 |
"step": 5000
|
109 |
},
|
110 |
{
|
111 |
-
"epoch":
|
112 |
"learning_rate": 6.599999999999999e-05,
|
113 |
-
"loss": 0.
|
114 |
"step": 5500
|
115 |
},
|
116 |
{
|
117 |
-
"epoch":
|
118 |
"learning_rate": 7.199999999999999e-05,
|
119 |
-
"loss": 0.
|
120 |
"step": 6000
|
121 |
},
|
122 |
{
|
123 |
-
"epoch":
|
124 |
-
"eval_loss": 0.
|
125 |
-
"eval_runtime": 1.
|
126 |
-
"eval_samples_per_second":
|
127 |
-
"eval_steps_per_second":
|
128 |
"step": 6000
|
129 |
},
|
130 |
{
|
131 |
-
"epoch":
|
132 |
"learning_rate": 7.8e-05,
|
133 |
-
"loss": 0.
|
134 |
"step": 6500
|
135 |
},
|
136 |
{
|
137 |
-
"epoch":
|
138 |
"learning_rate": 8.4e-05,
|
139 |
-
"loss": 0.
|
140 |
"step": 7000
|
141 |
},
|
142 |
{
|
143 |
-
"epoch":
|
144 |
-
"eval_loss": 0.
|
145 |
-
"eval_runtime": 1.
|
146 |
-
"eval_samples_per_second":
|
147 |
-
"eval_steps_per_second":
|
148 |
"step": 7000
|
149 |
},
|
150 |
{
|
151 |
-
"epoch":
|
152 |
"learning_rate": 8.999999999999999e-05,
|
153 |
-
"loss": 0.
|
154 |
"step": 7500
|
155 |
},
|
156 |
{
|
157 |
-
"epoch":
|
158 |
"learning_rate": 9.599999999999999e-05,
|
159 |
-
"loss": 0.
|
160 |
"step": 8000
|
161 |
},
|
162 |
{
|
163 |
-
"epoch":
|
164 |
-
"eval_loss": 0.
|
165 |
-
"eval_runtime": 1.
|
166 |
-
"eval_samples_per_second":
|
167 |
-
"eval_steps_per_second":
|
168 |
"step": 8000
|
169 |
},
|
170 |
{
|
171 |
-
"epoch":
|
172 |
"learning_rate": 0.000102,
|
173 |
-
"loss": 0.
|
174 |
"step": 8500
|
175 |
},
|
176 |
{
|
177 |
-
"epoch": 2
|
178 |
"learning_rate": 0.00010799999999999998,
|
179 |
-
"loss": 0.
|
180 |
"step": 9000
|
181 |
},
|
182 |
{
|
183 |
-
"epoch": 2
|
184 |
-
"eval_loss": 0.
|
185 |
-
"eval_runtime": 1.
|
186 |
-
"eval_samples_per_second":
|
187 |
-
"eval_steps_per_second":
|
188 |
"step": 9000
|
189 |
},
|
190 |
{
|
191 |
-
"epoch":
|
192 |
"learning_rate": 0.00011399999999999999,
|
193 |
-
"loss": 0.
|
194 |
"step": 9500
|
195 |
},
|
196 |
{
|
197 |
-
"epoch":
|
198 |
"learning_rate": 0.00011999999999999999,
|
199 |
-
"loss": 0.
|
200 |
"step": 10000
|
201 |
},
|
202 |
{
|
203 |
-
"epoch":
|
204 |
-
"eval_loss": 0.
|
205 |
-
"eval_runtime": 1.
|
206 |
-
"eval_samples_per_second":
|
207 |
-
"eval_steps_per_second":
|
208 |
"step": 10000
|
209 |
}
|
210 |
],
|
211 |
"max_steps": 500000,
|
212 |
-
"num_train_epochs":
|
213 |
-
"total_flos": 3.
|
214 |
"trial_name": null,
|
215 |
"trial_params": null
|
216 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.22305496074232692,
|
5 |
"global_step": 10000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
9 |
"log_history": [
|
10 |
{
|
11 |
+
"epoch": 0.01,
|
12 |
"learning_rate": 5.999999999999999e-06,
|
13 |
+
"loss": 0.9165,
|
14 |
"step": 500
|
15 |
},
|
16 |
{
|
17 |
+
"epoch": 0.02,
|
18 |
"learning_rate": 1.1999999999999999e-05,
|
19 |
+
"loss": 0.7051,
|
20 |
"step": 1000
|
21 |
},
|
22 |
{
|
23 |
+
"epoch": 0.02,
|
24 |
+
"eval_loss": 0.6818633079528809,
|
25 |
+
"eval_runtime": 1.9324,
|
26 |
+
"eval_samples_per_second": 1188.697,
|
27 |
+
"eval_steps_per_second": 18.63,
|
28 |
"step": 1000
|
29 |
},
|
30 |
{
|
31 |
+
"epoch": 0.03,
|
32 |
"learning_rate": 1.7999999999999997e-05,
|
33 |
+
"loss": 0.6818,
|
34 |
"step": 1500
|
35 |
},
|
36 |
{
|
37 |
+
"epoch": 0.04,
|
38 |
"learning_rate": 2.3999999999999997e-05,
|
39 |
+
"loss": 0.6808,
|
40 |
"step": 2000
|
41 |
},
|
42 |
{
|
43 |
+
"epoch": 0.04,
|
44 |
+
"eval_loss": 0.6788448691368103,
|
45 |
+
"eval_runtime": 1.762,
|
46 |
+
"eval_samples_per_second": 1303.62,
|
47 |
+
"eval_steps_per_second": 20.431,
|
48 |
"step": 2000
|
49 |
},
|
50 |
{
|
51 |
+
"epoch": 0.06,
|
52 |
"learning_rate": 2.9999999999999997e-05,
|
53 |
+
"loss": 0.6804,
|
54 |
"step": 2500
|
55 |
},
|
56 |
{
|
57 |
+
"epoch": 0.07,
|
58 |
"learning_rate": 3.5999999999999994e-05,
|
59 |
+
"loss": 0.6803,
|
60 |
"step": 3000
|
61 |
},
|
62 |
{
|
63 |
+
"epoch": 0.07,
|
64 |
+
"eval_loss": 0.678871750831604,
|
65 |
+
"eval_runtime": 1.9035,
|
66 |
+
"eval_samples_per_second": 1206.735,
|
67 |
+
"eval_steps_per_second": 18.913,
|
68 |
"step": 3000
|
69 |
},
|
70 |
{
|
71 |
+
"epoch": 0.08,
|
72 |
"learning_rate": 4.2e-05,
|
73 |
+
"loss": 0.6801,
|
74 |
"step": 3500
|
75 |
},
|
76 |
{
|
77 |
+
"epoch": 0.09,
|
78 |
"learning_rate": 4.7999999999999994e-05,
|
79 |
+
"loss": 0.68,
|
80 |
"step": 4000
|
81 |
},
|
82 |
{
|
83 |
+
"epoch": 0.09,
|
84 |
+
"eval_loss": 0.6781899333000183,
|
85 |
+
"eval_runtime": 1.9139,
|
86 |
+
"eval_samples_per_second": 1200.176,
|
87 |
+
"eval_steps_per_second": 18.81,
|
88 |
"step": 4000
|
89 |
},
|
90 |
{
|
91 |
+
"epoch": 0.1,
|
92 |
"learning_rate": 5.399999999999999e-05,
|
93 |
+
"loss": 0.6798,
|
94 |
"step": 4500
|
95 |
},
|
96 |
{
|
97 |
+
"epoch": 0.11,
|
98 |
"learning_rate": 5.9999999999999995e-05,
|
99 |
+
"loss": 0.6796,
|
100 |
"step": 5000
|
101 |
},
|
102 |
{
|
103 |
+
"epoch": 0.11,
|
104 |
+
"eval_loss": 0.6784412860870361,
|
105 |
+
"eval_runtime": 1.8311,
|
106 |
+
"eval_samples_per_second": 1254.405,
|
107 |
+
"eval_steps_per_second": 19.66,
|
108 |
"step": 5000
|
109 |
},
|
110 |
{
|
111 |
+
"epoch": 0.12,
|
112 |
"learning_rate": 6.599999999999999e-05,
|
113 |
+
"loss": 0.6792,
|
114 |
"step": 5500
|
115 |
},
|
116 |
{
|
117 |
+
"epoch": 0.13,
|
118 |
"learning_rate": 7.199999999999999e-05,
|
119 |
+
"loss": 0.6788,
|
120 |
"step": 6000
|
121 |
},
|
122 |
{
|
123 |
+
"epoch": 0.13,
|
124 |
+
"eval_loss": 0.67804354429245,
|
125 |
+
"eval_runtime": 1.8509,
|
126 |
+
"eval_samples_per_second": 1240.986,
|
127 |
+
"eval_steps_per_second": 19.449,
|
128 |
"step": 6000
|
129 |
},
|
130 |
{
|
131 |
+
"epoch": 0.14,
|
132 |
"learning_rate": 7.8e-05,
|
133 |
+
"loss": 0.6783,
|
134 |
"step": 6500
|
135 |
},
|
136 |
{
|
137 |
+
"epoch": 0.16,
|
138 |
"learning_rate": 8.4e-05,
|
139 |
+
"loss": 0.678,
|
140 |
"step": 7000
|
141 |
},
|
142 |
{
|
143 |
+
"epoch": 0.16,
|
144 |
+
"eval_loss": 0.6776260733604431,
|
145 |
+
"eval_runtime": 1.8893,
|
146 |
+
"eval_samples_per_second": 1215.825,
|
147 |
+
"eval_steps_per_second": 19.055,
|
148 |
"step": 7000
|
149 |
},
|
150 |
{
|
151 |
+
"epoch": 0.17,
|
152 |
"learning_rate": 8.999999999999999e-05,
|
153 |
+
"loss": 0.6778,
|
154 |
"step": 7500
|
155 |
},
|
156 |
{
|
157 |
+
"epoch": 0.18,
|
158 |
"learning_rate": 9.599999999999999e-05,
|
159 |
+
"loss": 0.678,
|
160 |
"step": 8000
|
161 |
},
|
162 |
{
|
163 |
+
"epoch": 0.18,
|
164 |
+
"eval_loss": 0.6782737374305725,
|
165 |
+
"eval_runtime": 1.8707,
|
166 |
+
"eval_samples_per_second": 1227.889,
|
167 |
+
"eval_steps_per_second": 19.244,
|
168 |
"step": 8000
|
169 |
},
|
170 |
{
|
171 |
+
"epoch": 0.19,
|
172 |
"learning_rate": 0.000102,
|
173 |
+
"loss": 0.6783,
|
174 |
"step": 8500
|
175 |
},
|
176 |
{
|
177 |
+
"epoch": 0.2,
|
178 |
"learning_rate": 0.00010799999999999998,
|
179 |
+
"loss": 0.6672,
|
180 |
"step": 9000
|
181 |
},
|
182 |
{
|
183 |
+
"epoch": 0.2,
|
184 |
+
"eval_loss": 0.6526092290878296,
|
185 |
+
"eval_runtime": 1.8141,
|
186 |
+
"eval_samples_per_second": 1266.219,
|
187 |
+
"eval_steps_per_second": 19.845,
|
188 |
"step": 9000
|
189 |
},
|
190 |
{
|
191 |
+
"epoch": 0.21,
|
192 |
"learning_rate": 0.00011399999999999999,
|
193 |
+
"loss": 0.6453,
|
194 |
"step": 9500
|
195 |
},
|
196 |
{
|
197 |
+
"epoch": 0.22,
|
198 |
"learning_rate": 0.00011999999999999999,
|
199 |
+
"loss": 0.632,
|
200 |
"step": 10000
|
201 |
},
|
202 |
{
|
203 |
+
"epoch": 0.22,
|
204 |
+
"eval_loss": 0.6212196350097656,
|
205 |
+
"eval_runtime": 1.9366,
|
206 |
+
"eval_samples_per_second": 1186.109,
|
207 |
+
"eval_steps_per_second": 18.589,
|
208 |
"step": 10000
|
209 |
}
|
210 |
],
|
211 |
"max_steps": 500000,
|
212 |
+
"num_train_epochs": 12,
|
213 |
+
"total_flos": 3.194871387745e+20,
|
214 |
"trial_name": null,
|
215 |
"trial_params": null
|
216 |
}
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3311
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:229efc1d49e061de5d19e6e496114be212e29dd2150b027ea46959c2a5a56c0b
|
3 |
size 3311
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 102501541
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4934ec353ee8c0b201d8896e01193b73d8d525ed3d2c04d990e1d6af1e4f1ff
|
3 |
size 102501541
|
text_renderer_config.json
CHANGED
@@ -16,18 +16,20 @@
|
|
16 |
"Nimbus Roman",
|
17 |
"Nimbus Sans",
|
18 |
"Nimbus Sans Narrow",
|
|
|
|
|
19 |
"Noto Kufi Arabic",
|
20 |
-
"Noto Looped Lao",
|
21 |
-
"Noto Looped Lao UI",
|
22 |
"Noto Music",
|
23 |
"Noto Naskh Arabic",
|
24 |
"Noto Naskh Arabic UI",
|
25 |
"Noto Nastaliq Urdu",
|
26 |
"Noto Rashi Hebrew",
|
|
|
27 |
"Noto Sans Adlam",
|
28 |
"Noto Sans Adlam Unjoined",
|
29 |
"Noto Sans Anatolian Hieroglyphs",
|
30 |
"Noto Sans Arabic",
|
|
|
31 |
"Noto Sans Armenian",
|
32 |
"Noto Sans Avestan",
|
33 |
"Noto Sans Balinese",
|
@@ -86,12 +88,16 @@
|
|
86 |
"Noto Sans Kaithi",
|
87 |
"Noto Sans Kannada",
|
88 |
"Noto Sans Kannada UI",
|
|
|
89 |
"Noto Sans Kayah Li",
|
90 |
"Noto Sans Kharoshthi",
|
91 |
"Noto Sans Khmer",
|
92 |
"Noto Sans Khmer UI",
|
|
|
93 |
"Noto Sans Khudawadi",
|
94 |
"Noto Sans Lao",
|
|
|
|
|
95 |
"Noto Sans Lao UI",
|
96 |
"Noto Sans Lepcha",
|
97 |
"Noto Sans Limbu",
|
@@ -123,13 +129,15 @@
|
|
123 |
"Noto Sans Myanmar UI",
|
124 |
"Noto Sans NKo",
|
125 |
"Noto Sans Nabataean",
|
|
|
126 |
"Noto Sans Nandinagari",
|
127 |
"Noto Sans New Tai Lue",
|
128 |
"Noto Sans Newa",
|
129 |
"Noto Sans Nushu",
|
130 |
"Noto Sans Ogham",
|
131 |
-
"Noto Sans
|
132 |
"Noto Sans Old Hungarian",
|
|
|
133 |
"Noto Sans Old North Arabian",
|
134 |
"Noto Sans Old Permic",
|
135 |
"Noto Sans Old Persian",
|
@@ -142,7 +150,7 @@
|
|
142 |
"Noto Sans Pahawh Hmong",
|
143 |
"Noto Sans Palmyrene",
|
144 |
"Noto Sans Pau Cin Hau",
|
145 |
-
"Noto Sans
|
146 |
"Noto Sans Phoenician",
|
147 |
"Noto Sans Psalter Pahlavi",
|
148 |
"Noto Sans Rejang",
|
@@ -156,11 +164,15 @@
|
|
156 |
"Noto Sans Sinhala",
|
157 |
"Noto Sans Sinhala UI",
|
158 |
"Noto Sans Sogdian",
|
|
|
159 |
"Noto Sans Soyombo",
|
|
|
160 |
"Noto Sans Syloti Nagri",
|
161 |
"Noto Sans Symbols",
|
162 |
-
"Noto Sans
|
163 |
"Noto Sans Syriac",
|
|
|
|
|
164 |
"Noto Sans Tagalog",
|
165 |
"Noto Sans Tagbanwa",
|
166 |
"Noto Sans Tai Le",
|
|
|
16 |
"Nimbus Roman",
|
17 |
"Nimbus Sans",
|
18 |
"Nimbus Sans Narrow",
|
19 |
+
"Noto Fangsong KSS Rotated",
|
20 |
+
"Noto Fangsong KSS Vertical",
|
21 |
"Noto Kufi Arabic",
|
|
|
|
|
22 |
"Noto Music",
|
23 |
"Noto Naskh Arabic",
|
24 |
"Noto Naskh Arabic UI",
|
25 |
"Noto Nastaliq Urdu",
|
26 |
"Noto Rashi Hebrew",
|
27 |
+
"Noto Sans",
|
28 |
"Noto Sans Adlam",
|
29 |
"Noto Sans Adlam Unjoined",
|
30 |
"Noto Sans Anatolian Hieroglyphs",
|
31 |
"Noto Sans Arabic",
|
32 |
+
"Noto Sans Arabic UI",
|
33 |
"Noto Sans Armenian",
|
34 |
"Noto Sans Avestan",
|
35 |
"Noto Sans Balinese",
|
|
|
88 |
"Noto Sans Kaithi",
|
89 |
"Noto Sans Kannada",
|
90 |
"Noto Sans Kannada UI",
|
91 |
+
"Noto Sans Kawi",
|
92 |
"Noto Sans Kayah Li",
|
93 |
"Noto Sans Kharoshthi",
|
94 |
"Noto Sans Khmer",
|
95 |
"Noto Sans Khmer UI",
|
96 |
+
"Noto Sans Khojki",
|
97 |
"Noto Sans Khudawadi",
|
98 |
"Noto Sans Lao",
|
99 |
+
"Noto Sans Lao Looped",
|
100 |
+
"Noto Sans Lao Looped UI",
|
101 |
"Noto Sans Lao UI",
|
102 |
"Noto Sans Lepcha",
|
103 |
"Noto Sans Limbu",
|
|
|
129 |
"Noto Sans Myanmar UI",
|
130 |
"Noto Sans NKo",
|
131 |
"Noto Sans Nabataean",
|
132 |
+
"Noto Sans Nag Mundari",
|
133 |
"Noto Sans Nandinagari",
|
134 |
"Noto Sans New Tai Lue",
|
135 |
"Noto Sans Newa",
|
136 |
"Noto Sans Nushu",
|
137 |
"Noto Sans Ogham",
|
138 |
+
"Noto Sans Ol Chiki",
|
139 |
"Noto Sans Old Hungarian",
|
140 |
+
"Noto Sans Old Italic",
|
141 |
"Noto Sans Old North Arabian",
|
142 |
"Noto Sans Old Permic",
|
143 |
"Noto Sans Old Persian",
|
|
|
150 |
"Noto Sans Pahawh Hmong",
|
151 |
"Noto Sans Palmyrene",
|
152 |
"Noto Sans Pau Cin Hau",
|
153 |
+
"Noto Sans Phags-Pa",
|
154 |
"Noto Sans Phoenician",
|
155 |
"Noto Sans Psalter Pahlavi",
|
156 |
"Noto Sans Rejang",
|
|
|
164 |
"Noto Sans Sinhala",
|
165 |
"Noto Sans Sinhala UI",
|
166 |
"Noto Sans Sogdian",
|
167 |
+
"Noto Sans Sora Sompeng",
|
168 |
"Noto Sans Soyombo",
|
169 |
+
"Noto Sans Sundanese",
|
170 |
"Noto Sans Syloti Nagri",
|
171 |
"Noto Sans Symbols",
|
172 |
+
"Noto Sans Symbols 2",
|
173 |
"Noto Sans Syriac",
|
174 |
+
"Noto Sans Syriac Eastern",
|
175 |
+
"Noto Sans Syriac Western",
|
176 |
"Noto Sans Tagalog",
|
177 |
"Noto Sans Tagbanwa",
|
178 |
"Noto Sans Tai Le",
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3311
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:229efc1d49e061de5d19e6e496114be212e29dd2150b027ea46959c2a5a56c0b
|
3 |
size 3311
|