Update README.md
Browse files
README.md
CHANGED
@@ -1,199 +1,337 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
|
15 |
-
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
|
20 |
-
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
|
28 |
-
|
29 |
-
|
30 |
-
|
31 |
-
|
32 |
-
|
33 |
-
|
34 |
-
|
35 |
-
|
36 |
-
|
37 |
-
|
38 |
-
|
39 |
-
|
40 |
-
|
41 |
-
|
42 |
-
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
57 |
-
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
-
|
62 |
-
|
63 |
-
|
64 |
-
|
65 |
-
|
66 |
-
|
67 |
-
|
68 |
-
|
69 |
-
|
70 |
-
|
71 |
-
|
72 |
-
|
73 |
-
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
|
93 |
-
|
94 |
-
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
|
99 |
-
|
100 |
-
|
101 |
-
|
102 |
-
|
103 |
-
|
104 |
-
|
105 |
-
|
106 |
-
|
107 |
-
|
108 |
-
|
109 |
-
|
110 |
-
|
111 |
-
|
112 |
-
|
113 |
-
|
114 |
-
|
115 |
-
|
116 |
-
|
117 |
-
|
118 |
-
|
119 |
-
|
120 |
-
|
121 |
-
|
122 |
-
|
123 |
-
|
124 |
-
|
125 |
-
|
126 |
-
|
127 |
-
|
128 |
-
|
129 |
-
|
130 |
-
|
131 |
-
|
132 |
-
|
133 |
-
|
134 |
-
|
135 |
-
|
136 |
-
|
137 |
-
|
138 |
-
|
139 |
-
|
140 |
-
|
141 |
-
|
142 |
-
|
143 |
-
|
144 |
-
|
145 |
-
|
146 |
-
|
147 |
-
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
|
152 |
-
|
153 |
-
|
154 |
-
|
155 |
-
|
156 |
-
|
157 |
-
|
158 |
-
|
159 |
-
|
160 |
-
|
161 |
-
|
162 |
-
|
163 |
-
|
164 |
-
|
165 |
-
|
166 |
-
|
167 |
-
|
168 |
-
|
169 |
-
|
170 |
-
|
171 |
-
|
172 |
-
|
173 |
-
|
174 |
-
|
175 |
-
|
176 |
-
|
177 |
-
|
178 |
-
|
179 |
-
|
180 |
-
|
181 |
-
|
182 |
-
|
183 |
-
|
184 |
-
|
185 |
-
|
186 |
-
|
187 |
-
|
188 |
-
|
189 |
-
|
190 |
-
|
191 |
-
|
192 |
-
|
193 |
-
|
194 |
-
|
195 |
-
|
196 |
-
|
197 |
-
|
198 |
-
|
199 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
## This model was trained for 2 epochs with Unsloth on the Internal Knowledge Map dataset (full training log below)
|
2 |
+
|
3 |
+
```
|
4 |
+
==((====))== Unsloth - 2x faster free finetuning | Num GPUs = 1
|
5 |
+
\\ /| Num examples = 2,614 | Num Epochs = 2
|
6 |
+
O^O/ \_/ \ Batch size per device = 4 | Gradient Accumulation steps = 4
|
7 |
+
\ / Total batch size = 16 | Total steps = 326
|
8 |
+
"-____-" Number of trainable parameters = 83,886,080
|
9 |
+
[326/326 09:13, Epoch 1/2]
|
10 |
+
Step Training Loss
|
11 |
+
1 3.122400
|
12 |
+
2 3.146700
|
13 |
+
3 3.077300
|
14 |
+
4 3.072800
|
15 |
+
5 3.052400
|
16 |
+
6 3.032800
|
17 |
+
7 3.040000
|
18 |
+
8 3.078500
|
19 |
+
9 3.054300
|
20 |
+
10 3.031500
|
21 |
+
11 3.022800
|
22 |
+
12 3.030600
|
23 |
+
13 3.034800
|
24 |
+
14 3.023000
|
25 |
+
15 3.010300
|
26 |
+
16 3.066700
|
27 |
+
17 3.009200
|
28 |
+
18 2.950200
|
29 |
+
19 2.972900
|
30 |
+
20 2.975500
|
31 |
+
21 2.975900
|
32 |
+
22 2.933600
|
33 |
+
23 2.949500
|
34 |
+
24 3.000900
|
35 |
+
25 2.878700
|
36 |
+
26 2.950200
|
37 |
+
27 2.893500
|
38 |
+
28 2.875300
|
39 |
+
29 2.976100
|
40 |
+
30 2.869200
|
41 |
+
31 2.911700
|
42 |
+
32 2.795500
|
43 |
+
33 2.799400
|
44 |
+
34 2.849400
|
45 |
+
35 2.809000
|
46 |
+
36 2.795200
|
47 |
+
37 2.805400
|
48 |
+
38 2.787700
|
49 |
+
39 2.749900
|
50 |
+
40 2.735900
|
51 |
+
41 2.829800
|
52 |
+
42 2.774600
|
53 |
+
43 2.716500
|
54 |
+
44 2.803900
|
55 |
+
45 2.657600
|
56 |
+
46 2.701500
|
57 |
+
47 2.638200
|
58 |
+
48 2.788100
|
59 |
+
49 2.600000
|
60 |
+
50 2.599400
|
61 |
+
51 2.564500
|
62 |
+
52 2.587100
|
63 |
+
53 2.541100
|
64 |
+
54 2.541300
|
65 |
+
55 2.565700
|
66 |
+
56 2.584000
|
67 |
+
57 2.583400
|
68 |
+
58 2.622200
|
69 |
+
59 2.484100
|
70 |
+
60 2.414400
|
71 |
+
61 2.435400
|
72 |
+
62 2.417200
|
73 |
+
63 2.519300
|
74 |
+
64 2.527100
|
75 |
+
65 2.419200
|
76 |
+
66 2.393400
|
77 |
+
67 2.350400
|
78 |
+
68 2.463400
|
79 |
+
69 2.427600
|
80 |
+
70 2.287600
|
81 |
+
71 2.290400
|
82 |
+
72 2.313200
|
83 |
+
73 2.252300
|
84 |
+
74 2.275400
|
85 |
+
75 2.251900
|
86 |
+
76 2.325800
|
87 |
+
77 2.174600
|
88 |
+
78 2.158100
|
89 |
+
79 2.215200
|
90 |
+
80 2.094500
|
91 |
+
81 2.239300
|
92 |
+
82 2.163100
|
93 |
+
83 2.239600
|
94 |
+
84 2.058000
|
95 |
+
85 2.099200
|
96 |
+
86 2.063500
|
97 |
+
87 2.042700
|
98 |
+
88 1.981600
|
99 |
+
89 2.005200
|
100 |
+
90 2.009200
|
101 |
+
91 1.971600
|
102 |
+
92 1.989700
|
103 |
+
93 1.957000
|
104 |
+
94 1.871600
|
105 |
+
95 1.928000
|
106 |
+
96 1.931000
|
107 |
+
97 1.812400
|
108 |
+
98 1.867900
|
109 |
+
99 1.745100
|
110 |
+
100 1.864200
|
111 |
+
101 1.708200
|
112 |
+
102 1.903700
|
113 |
+
103 1.789400
|
114 |
+
104 1.760100
|
115 |
+
105 1.636100
|
116 |
+
106 1.826100
|
117 |
+
107 1.816700
|
118 |
+
108 1.753400
|
119 |
+
109 1.760800
|
120 |
+
110 1.720400
|
121 |
+
111 1.511300
|
122 |
+
112 1.614200
|
123 |
+
113 1.632700
|
124 |
+
114 1.480100
|
125 |
+
115 1.548600
|
126 |
+
116 1.623400
|
127 |
+
117 1.629900
|
128 |
+
118 1.435100
|
129 |
+
119 1.460700
|
130 |
+
120 1.482000
|
131 |
+
121 1.305400
|
132 |
+
122 1.231600
|
133 |
+
123 1.581200
|
134 |
+
124 1.193100
|
135 |
+
125 1.216200
|
136 |
+
126 1.293600
|
137 |
+
127 1.158300
|
138 |
+
128 1.211200
|
139 |
+
129 1.184000
|
140 |
+
130 1.116600
|
141 |
+
131 1.146400
|
142 |
+
132 1.255100
|
143 |
+
133 1.085800
|
144 |
+
134 0.993300
|
145 |
+
135 1.134800
|
146 |
+
136 1.293100
|
147 |
+
137 1.377800
|
148 |
+
138 0.779900
|
149 |
+
139 0.889400
|
150 |
+
140 0.849800
|
151 |
+
141 1.080100
|
152 |
+
142 0.969100
|
153 |
+
143 1.034000
|
154 |
+
144 0.868000
|
155 |
+
145 0.727900
|
156 |
+
146 0.688100
|
157 |
+
147 0.870200
|
158 |
+
148 0.782700
|
159 |
+
149 0.672200
|
160 |
+
150 0.690100
|
161 |
+
151 0.665900
|
162 |
+
152 0.694800
|
163 |
+
153 0.642100
|
164 |
+
154 0.435800
|
165 |
+
155 0.575800
|
166 |
+
156 0.678400
|
167 |
+
157 0.540300
|
168 |
+
158 0.550200
|
169 |
+
159 0.652300
|
170 |
+
160 0.397500
|
171 |
+
161 0.839400
|
172 |
+
162 0.480400
|
173 |
+
163 0.533200
|
174 |
+
164 0.331800
|
175 |
+
165 0.470100
|
176 |
+
166 0.485200
|
177 |
+
167 0.350000
|
178 |
+
168 0.490200
|
179 |
+
169 0.353600
|
180 |
+
170 0.445700
|
181 |
+
171 0.461700
|
182 |
+
172 0.471700
|
183 |
+
173 0.217400
|
184 |
+
174 0.795300
|
185 |
+
175 0.276600
|
186 |
+
176 0.146400
|
187 |
+
177 0.776800
|
188 |
+
178 0.262800
|
189 |
+
179 0.276800
|
190 |
+
180 0.269000
|
191 |
+
181 0.256000
|
192 |
+
182 0.580300
|
193 |
+
183 0.223600
|
194 |
+
184 0.148800
|
195 |
+
185 0.309900
|
196 |
+
186 0.931900
|
197 |
+
187 0.177100
|
198 |
+
188 0.253300
|
199 |
+
189 0.669300
|
200 |
+
190 0.535500
|
201 |
+
191 0.180600
|
202 |
+
192 0.332300
|
203 |
+
193 0.498300
|
204 |
+
194 0.249200
|
205 |
+
195 0.532900
|
206 |
+
196 0.214900
|
207 |
+
197 0.453000
|
208 |
+
198 0.321500
|
209 |
+
199 0.230500
|
210 |
+
200 0.121200
|
211 |
+
201 0.243600
|
212 |
+
202 0.341000
|
213 |
+
203 0.303100
|
214 |
+
204 0.194500
|
215 |
+
205 0.379500
|
216 |
+
206 0.212300
|
217 |
+
207 0.728000
|
218 |
+
208 0.465900
|
219 |
+
209 0.168300
|
220 |
+
210 0.325700
|
221 |
+
211 0.083800
|
222 |
+
212 0.299700
|
223 |
+
213 0.578800
|
224 |
+
214 0.080600
|
225 |
+
215 0.181000
|
226 |
+
216 0.104500
|
227 |
+
217 0.425300
|
228 |
+
218 0.378300
|
229 |
+
219 0.150900
|
230 |
+
220 0.186100
|
231 |
+
221 0.297500
|
232 |
+
222 0.447000
|
233 |
+
223 0.350500
|
234 |
+
224 0.203000
|
235 |
+
225 0.154800
|
236 |
+
226 0.195300
|
237 |
+
227 0.036700
|
238 |
+
228 0.160900
|
239 |
+
229 0.330500
|
240 |
+
230 0.574200
|
241 |
+
231 0.526900
|
242 |
+
232 0.274500
|
243 |
+
233 0.388700
|
244 |
+
234 0.212200
|
245 |
+
235 0.251600
|
246 |
+
236 0.150400
|
247 |
+
237 0.460500
|
248 |
+
238 0.107800
|
249 |
+
239 0.097400
|
250 |
+
240 0.136000
|
251 |
+
241 0.390400
|
252 |
+
242 0.279900
|
253 |
+
243 0.507000
|
254 |
+
244 0.472500
|
255 |
+
245 0.354900
|
256 |
+
246 0.333400
|
257 |
+
247 0.305500
|
258 |
+
248 0.254900
|
259 |
+
249 0.251000
|
260 |
+
250 0.469400
|
261 |
+
251 0.364700
|
262 |
+
252 0.185600
|
263 |
+
253 0.150500
|
264 |
+
254 0.354000
|
265 |
+
255 0.133900
|
266 |
+
256 0.093200
|
267 |
+
257 0.297700
|
268 |
+
258 0.180200
|
269 |
+
259 0.216000
|
270 |
+
260 0.113900
|
271 |
+
261 0.283700
|
272 |
+
262 0.134100
|
273 |
+
263 0.033800
|
274 |
+
264 0.358600
|
275 |
+
265 0.453800
|
276 |
+
266 0.326100
|
277 |
+
267 0.166000
|
278 |
+
268 0.371600
|
279 |
+
269 0.129800
|
280 |
+
270 0.173600
|
281 |
+
271 0.161700
|
282 |
+
272 0.052800
|
283 |
+
273 0.140600
|
284 |
+
274 0.052200
|
285 |
+
275 0.392400
|
286 |
+
276 0.103700
|
287 |
+
277 0.206600
|
288 |
+
278 0.077600
|
289 |
+
279 0.267900
|
290 |
+
280 0.425900
|
291 |
+
281 0.033300
|
292 |
+
282 0.262400
|
293 |
+
283 0.163300
|
294 |
+
284 0.317800
|
295 |
+
285 0.394600
|
296 |
+
286 0.257400
|
297 |
+
287 0.207600
|
298 |
+
288 0.339600
|
299 |
+
289 0.309500
|
300 |
+
290 0.195000
|
301 |
+
291 0.362300
|
302 |
+
292 0.209900
|
303 |
+
293 0.278600
|
304 |
+
294 0.312100
|
305 |
+
295 0.203300
|
306 |
+
296 0.159400
|
307 |
+
297 0.108100
|
308 |
+
298 0.380800
|
309 |
+
299 0.200700
|
310 |
+
300 0.230700
|
311 |
+
301 0.333100
|
312 |
+
302 0.231800
|
313 |
+
303 0.168700
|
314 |
+
304 0.108700
|
315 |
+
305 0.093100
|
316 |
+
306 0.223000
|
317 |
+
307 0.174300
|
318 |
+
308 0.301100
|
319 |
+
309 0.317200
|
320 |
+
310 0.289300
|
321 |
+
311 0.033000
|
322 |
+
312 0.147200
|
323 |
+
313 0.211600
|
324 |
+
314 0.150000
|
325 |
+
315 0.069700
|
326 |
+
316 0.184500
|
327 |
+
317 0.041900
|
328 |
+
318 0.067700
|
329 |
+
319 0.113800
|
330 |
+
320 0.231100
|
331 |
+
321 0.139300
|
332 |
+
322 0.135500
|
333 |
+
323 0.190800
|
334 |
+
324 0.097400
|
335 |
+
325 0.087900
|
336 |
+
326 0.032600
|
337 |
+
```
|