File size: 120,249 Bytes
c34aa36 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 |
{"current_steps": 5, "total_steps": 2341, "loss": 1.0426, "learning_rate": 4.999943721137594e-05, "epoch": 0.002135383301302584, "percentage": 0.21, "elapsed_time": "0:01:56", "remaining_time": "15:04:16", "throughput": 1094.22, "total_tokens": 127072}
{"current_steps": 10, "total_steps": 2341, "loss": 1.0578, "learning_rate": 4.999774887084225e-05, "epoch": 0.004270766602605168, "percentage": 0.43, "elapsed_time": "0:04:12", "remaining_time": "16:22:42", "throughput": 1113.77, "total_tokens": 281728}
{"current_steps": 15, "total_steps": 2341, "loss": 0.6602, "learning_rate": 4.999493505441324e-05, "epoch": 0.0064061499039077515, "percentage": 0.64, "elapsed_time": "0:05:56", "remaining_time": "15:20:09", "throughput": 1107.49, "total_tokens": 394304}
{"current_steps": 20, "total_steps": 2341, "loss": 0.961, "learning_rate": 4.9990995888775614e-05, "epoch": 0.008541533205210335, "percentage": 0.85, "elapsed_time": "0:08:25", "remaining_time": "16:17:42", "throughput": 1111.56, "total_tokens": 561888}
{"current_steps": 25, "total_steps": 2341, "loss": 0.9722, "learning_rate": 4.9985931551282785e-05, "epoch": 0.010676916506512918, "percentage": 1.07, "elapsed_time": "0:10:47", "remaining_time": "16:40:24", "throughput": 1115.08, "total_tokens": 722496}
{"current_steps": 30, "total_steps": 2341, "loss": 0.7008, "learning_rate": 4.997974226994687e-05, "epoch": 0.012812299807815503, "percentage": 1.28, "elapsed_time": "0:12:43", "remaining_time": "16:19:41", "throughput": 1114.17, "total_tokens": 850176}
{"current_steps": 35, "total_steps": 2341, "loss": 0.9035, "learning_rate": 4.9972428323428444e-05, "epoch": 0.014947683109118086, "percentage": 1.5, "elapsed_time": "0:15:09", "remaining_time": "16:38:39", "throughput": 1118.56, "total_tokens": 1017280}
{"current_steps": 40, "total_steps": 2341, "loss": 0.868, "learning_rate": 4.996399004102397e-05, "epoch": 0.01708306641042067, "percentage": 1.71, "elapsed_time": "0:17:48", "remaining_time": "17:04:46", "throughput": 1122.28, "total_tokens": 1199552}
{"current_steps": 45, "total_steps": 2341, "loss": 0.7532, "learning_rate": 4.9954427802651014e-05, "epoch": 0.019218449711723255, "percentage": 1.92, "elapsed_time": "0:19:56", "remaining_time": "16:57:43", "throughput": 1122.78, "total_tokens": 1343744}
{"current_steps": 50, "total_steps": 2341, "loss": 0.7994, "learning_rate": 4.9943742038831076e-05, "epoch": 0.021353833013025837, "percentage": 2.14, "elapsed_time": "0:22:25", "remaining_time": "17:07:29", "throughput": 1125.19, "total_tokens": 1513920}
{"current_steps": 55, "total_steps": 2341, "loss": 0.8082, "learning_rate": 4.993193323067027e-05, "epoch": 0.02348921631432842, "percentage": 2.35, "elapsed_time": "0:24:53", "remaining_time": "17:14:17", "throughput": 1125.26, "total_tokens": 1680096}
{"current_steps": 60, "total_steps": 2341, "loss": 0.7103, "learning_rate": 4.9919001909837625e-05, "epoch": 0.025624599615631006, "percentage": 2.56, "elapsed_time": "0:27:24", "remaining_time": "17:22:08", "throughput": 1126.79, "total_tokens": 1853312}
{"current_steps": 65, "total_steps": 2341, "loss": 0.6723, "learning_rate": 4.990494865854116e-05, "epoch": 0.02775998291693359, "percentage": 2.78, "elapsed_time": "0:29:41", "remaining_time": "17:19:38", "throughput": 1126.62, "total_tokens": 2007040}
{"current_steps": 70, "total_steps": 2341, "loss": 0.6473, "learning_rate": 4.9889774109501675e-05, "epoch": 0.029895366218236172, "percentage": 2.99, "elapsed_time": "0:31:31", "remaining_time": "17:02:40", "throughput": 1124.83, "total_tokens": 2127456}
{"current_steps": 75, "total_steps": 2341, "loss": 0.8123, "learning_rate": 4.987347894592426e-05, "epoch": 0.032030749519538756, "percentage": 3.2, "elapsed_time": "0:33:44", "remaining_time": "16:59:27", "throughput": 1124.71, "total_tokens": 2276992}
{"current_steps": 80, "total_steps": 2341, "loss": 0.8803, "learning_rate": 4.985606390146752e-05, "epoch": 0.03416613282084134, "percentage": 3.42, "elapsed_time": "0:36:28", "remaining_time": "17:11:00", "throughput": 1125.64, "total_tokens": 2463776}
{"current_steps": 85, "total_steps": 2341, "loss": 0.7062, "learning_rate": 4.983752976021058e-05, "epoch": 0.036301516122143926, "percentage": 3.63, "elapsed_time": "0:38:44", "remaining_time": "17:08:22", "throughput": 1126.68, "total_tokens": 2619296}
{"current_steps": 90, "total_steps": 2341, "loss": 0.7329, "learning_rate": 4.981787735661774e-05, "epoch": 0.03843689942344651, "percentage": 3.84, "elapsed_time": "0:41:28", "remaining_time": "17:17:17", "throughput": 1128.23, "total_tokens": 2807456}
{"current_steps": 95, "total_steps": 2341, "loss": 0.708, "learning_rate": 4.9797107575500934e-05, "epoch": 0.040572282724749095, "percentage": 4.06, "elapsed_time": "0:44:02", "remaining_time": "17:21:12", "throughput": 1128.73, "total_tokens": 2982592}
{"current_steps": 100, "total_steps": 2341, "loss": 0.686, "learning_rate": 4.977522135197988e-05, "epoch": 0.04270766602605167, "percentage": 4.27, "elapsed_time": "0:46:05", "remaining_time": "17:12:51", "throughput": 1127.59, "total_tokens": 3118176}
{"current_steps": 105, "total_steps": 2341, "loss": 0.8154, "learning_rate": 4.975221967144e-05, "epoch": 0.04484304932735426, "percentage": 4.49, "elapsed_time": "0:49:00", "remaining_time": "17:23:28", "throughput": 1128.74, "total_tokens": 3318528}
{"current_steps": 110, "total_steps": 2341, "loss": 0.7786, "learning_rate": 4.972810356948803e-05, "epoch": 0.04697843262865684, "percentage": 4.7, "elapsed_time": "0:50:56", "remaining_time": "17:13:14", "throughput": 1127.53, "total_tokens": 3446496}
{"current_steps": 115, "total_steps": 2341, "loss": 0.848, "learning_rate": 4.9702874131905375e-05, "epoch": 0.04911381592995943, "percentage": 4.91, "elapsed_time": "0:53:39", "remaining_time": "17:18:42", "throughput": 1128.53, "total_tokens": 3633536}
{"current_steps": 120, "total_steps": 2341, "loss": 0.6415, "learning_rate": 4.967653249459928e-05, "epoch": 0.05124919923126201, "percentage": 5.13, "elapsed_time": "0:56:04", "remaining_time": "17:17:53", "throughput": 1128.78, "total_tokens": 3797920}
{"current_steps": 125, "total_steps": 2341, "loss": 0.885, "learning_rate": 4.9649079843551663e-05, "epoch": 0.053384582532564596, "percentage": 5.34, "elapsed_time": "0:58:35", "remaining_time": "17:18:51", "throughput": 1129.78, "total_tokens": 3972288}
{"current_steps": 130, "total_steps": 2341, "loss": 0.7594, "learning_rate": 4.9620517414765685e-05, "epoch": 0.05551996583386718, "percentage": 5.55, "elapsed_time": "1:01:15", "remaining_time": "17:21:57", "throughput": 1130.5, "total_tokens": 4155520}
{"current_steps": 135, "total_steps": 2341, "loss": 0.5479, "learning_rate": 4.959084649421016e-05, "epoch": 0.057655349135169766, "percentage": 5.77, "elapsed_time": "1:03:40", "remaining_time": "17:20:32", "throughput": 1130.55, "total_tokens": 4319488}
{"current_steps": 140, "total_steps": 2341, "loss": 0.7997, "learning_rate": 4.9560068417761595e-05, "epoch": 0.059790732436472344, "percentage": 5.98, "elapsed_time": "1:05:56", "remaining_time": "17:16:46", "throughput": 1130.49, "total_tokens": 4473120}
{"current_steps": 145, "total_steps": 2341, "loss": 0.7524, "learning_rate": 4.952818457114411e-05, "epoch": 0.06192611573777493, "percentage": 6.19, "elapsed_time": "1:08:01", "remaining_time": "17:10:09", "throughput": 1130.24, "total_tokens": 4612768}
{"current_steps": 150, "total_steps": 2341, "loss": 0.7524, "learning_rate": 4.9495196389866995e-05, "epoch": 0.06406149903907751, "percentage": 6.41, "elapsed_time": "1:10:03", "remaining_time": "17:03:19", "throughput": 1129.45, "total_tokens": 4747680}
{"current_steps": 155, "total_steps": 2341, "loss": 0.7265, "learning_rate": 4.946110535916009e-05, "epoch": 0.0661968823403801, "percentage": 6.62, "elapsed_time": "1:12:53", "remaining_time": "17:08:05", "throughput": 1130.18, "total_tokens": 4943264}
{"current_steps": 160, "total_steps": 2341, "loss": 0.6025, "learning_rate": 4.942591301390695e-05, "epoch": 0.06833226564168268, "percentage": 6.83, "elapsed_time": "1:15:01", "remaining_time": "17:02:37", "throughput": 1129.78, "total_tokens": 5085408}
{"current_steps": 165, "total_steps": 2341, "loss": 0.6499, "learning_rate": 4.9389620938575695e-05, "epoch": 0.07046764894298527, "percentage": 7.05, "elapsed_time": "1:17:30", "remaining_time": "17:02:15", "throughput": 1130.17, "total_tokens": 5256288}
{"current_steps": 170, "total_steps": 2341, "loss": 0.723, "learning_rate": 4.935223076714769e-05, "epoch": 0.07260303224428785, "percentage": 7.26, "elapsed_time": "1:20:09", "remaining_time": "17:03:39", "throughput": 1130.55, "total_tokens": 5437312}
{"current_steps": 175, "total_steps": 2341, "loss": 0.7537, "learning_rate": 4.9313744183044e-05, "epoch": 0.07473841554559044, "percentage": 7.48, "elapsed_time": "1:22:08", "remaining_time": "16:56:39", "throughput": 1129.95, "total_tokens": 5568800}
{"current_steps": 180, "total_steps": 2341, "loss": 0.7523, "learning_rate": 4.927416291904955e-05, "epoch": 0.07687379884689302, "percentage": 7.69, "elapsed_time": "1:24:27", "remaining_time": "16:53:57", "throughput": 1129.09, "total_tokens": 5721568}
{"current_steps": 185, "total_steps": 2341, "loss": 0.6245, "learning_rate": 4.9233488757235145e-05, "epoch": 0.0790091821481956, "percentage": 7.9, "elapsed_time": "1:26:42", "remaining_time": "16:50:27", "throughput": 1129.18, "total_tokens": 5874336}
{"current_steps": 190, "total_steps": 2341, "loss": 0.7379, "learning_rate": 4.919172352887725e-05, "epoch": 0.08114456544949819, "percentage": 8.12, "elapsed_time": "1:29:01", "remaining_time": "16:47:54", "throughput": 1129.2, "total_tokens": 6031904}
{"current_steps": 195, "total_steps": 2341, "loss": 0.6706, "learning_rate": 4.914886911437547e-05, "epoch": 0.08327994875080078, "percentage": 8.33, "elapsed_time": "1:31:30", "remaining_time": "16:47:06", "throughput": 1129.38, "total_tokens": 6201152}
{"current_steps": 200, "total_steps": 2341, "loss": 0.6494, "learning_rate": 4.910492744316799e-05, "epoch": 0.08541533205210335, "percentage": 8.54, "elapsed_time": "1:33:47", "remaining_time": "16:44:05", "throughput": 1129.47, "total_tokens": 6356416}
{"current_steps": 205, "total_steps": 2341, "loss": 0.7371, "learning_rate": 4.905990049364461e-05, "epoch": 0.08755071535340593, "percentage": 8.76, "elapsed_time": "1:35:56", "remaining_time": "16:39:40", "throughput": 1129.55, "total_tokens": 6502272}
{"current_steps": 210, "total_steps": 2341, "loss": 0.7105, "learning_rate": 4.9013790293057714e-05, "epoch": 0.08968609865470852, "percentage": 8.97, "elapsed_time": "1:38:16", "remaining_time": "16:37:19", "throughput": 1129.82, "total_tokens": 6662432}
{"current_steps": 215, "total_steps": 2341, "loss": 0.6886, "learning_rate": 4.8966598917431036e-05, "epoch": 0.0918214819560111, "percentage": 9.18, "elapsed_time": "1:40:40", "remaining_time": "16:35:33", "throughput": 1129.99, "total_tokens": 6826048}
{"current_steps": 220, "total_steps": 2341, "loss": 0.6842, "learning_rate": 4.8918328491466106e-05, "epoch": 0.09395686525731368, "percentage": 9.4, "elapsed_time": "1:43:09", "remaining_time": "16:34:34", "throughput": 1129.76, "total_tokens": 6992928}
{"current_steps": 225, "total_steps": 2341, "loss": 0.733, "learning_rate": 4.886898118844666e-05, "epoch": 0.09609224855861627, "percentage": 9.61, "elapsed_time": "1:45:10", "remaining_time": "16:29:05", "throughput": 1129.69, "total_tokens": 7128704}
{"current_steps": 230, "total_steps": 2341, "loss": 0.5728, "learning_rate": 4.881855923014076e-05, "epoch": 0.09822763185991885, "percentage": 9.82, "elapsed_time": "1:47:14", "remaining_time": "16:24:17", "throughput": 1129.3, "total_tokens": 7266464}
{"current_steps": 235, "total_steps": 2341, "loss": 0.6706, "learning_rate": 4.876706488670077e-05, "epoch": 0.10036301516122144, "percentage": 10.04, "elapsed_time": "1:49:39", "remaining_time": "16:22:47", "throughput": 1129.32, "total_tokens": 7430912}
{"current_steps": 240, "total_steps": 2341, "loss": 0.6395, "learning_rate": 4.871450047656114e-05, "epoch": 0.10249839846252402, "percentage": 10.25, "elapsed_time": "1:51:36", "remaining_time": "16:17:06", "throughput": 1128.91, "total_tokens": 7560288}
{"current_steps": 245, "total_steps": 2341, "loss": 0.6815, "learning_rate": 4.866086836633403e-05, "epoch": 0.10463378176382661, "percentage": 10.47, "elapsed_time": "1:53:49", "remaining_time": "16:13:43", "throughput": 1128.77, "total_tokens": 7708480}
{"current_steps": 250, "total_steps": 2341, "loss": 0.8152, "learning_rate": 4.860617097070278e-05, "epoch": 0.10676916506512919, "percentage": 10.68, "elapsed_time": "1:56:12", "remaining_time": "16:11:57", "throughput": 1128.89, "total_tokens": 7871168}
{"current_steps": 255, "total_steps": 2341, "loss": 0.7163, "learning_rate": 4.855041075231314e-05, "epoch": 0.10890454836643178, "percentage": 10.89, "elapsed_time": "1:58:18", "remaining_time": "16:07:48", "throughput": 1128.58, "total_tokens": 8011264}
{"current_steps": 260, "total_steps": 2341, "loss": 0.73, "learning_rate": 4.8493590221662436e-05, "epoch": 0.11103993166773436, "percentage": 11.11, "elapsed_time": "2:00:23", "remaining_time": "16:03:33", "throughput": 1128.62, "total_tokens": 8152320}
{"current_steps": 265, "total_steps": 2341, "loss": 0.8089, "learning_rate": 4.843571193698653e-05, "epoch": 0.11317531496903695, "percentage": 11.32, "elapsed_time": "2:02:30", "remaining_time": "15:59:43", "throughput": 1128.26, "total_tokens": 8293312}
{"current_steps": 270, "total_steps": 2341, "loss": 0.6812, "learning_rate": 4.837677850414464e-05, "epoch": 0.11531069827033953, "percentage": 11.53, "elapsed_time": "2:05:08", "remaining_time": "15:59:55", "throughput": 1128.39, "total_tokens": 8472896}
{"current_steps": 275, "total_steps": 2341, "loss": 0.7619, "learning_rate": 4.8316792576502004e-05, "epoch": 0.11744608157164212, "percentage": 11.75, "elapsed_time": "2:07:39", "remaining_time": "15:59:01", "throughput": 1128.52, "total_tokens": 8643552}
{"current_steps": 280, "total_steps": 2341, "loss": 0.7461, "learning_rate": 4.825575685481045e-05, "epoch": 0.11958146487294469, "percentage": 11.96, "elapsed_time": "2:10:00", "remaining_time": "15:56:58", "throughput": 1128.71, "total_tokens": 8804736}
{"current_steps": 285, "total_steps": 2341, "loss": 0.8225, "learning_rate": 4.819367408708676e-05, "epoch": 0.12171684817424727, "percentage": 12.17, "elapsed_time": "2:12:10", "remaining_time": "15:53:27", "throughput": 1128.83, "total_tokens": 8951648}
{"current_steps": 290, "total_steps": 2341, "loss": 0.7792, "learning_rate": 4.8130547068488954e-05, "epoch": 0.12385223147554986, "percentage": 12.39, "elapsed_time": "2:14:19", "remaining_time": "15:50:02", "throughput": 1128.71, "total_tokens": 9097312}
{"current_steps": 295, "total_steps": 2341, "loss": 0.8316, "learning_rate": 4.806637864119049e-05, "epoch": 0.12598761477685244, "percentage": 12.6, "elapsed_time": "2:16:23", "remaining_time": "15:45:54", "throughput": 1128.52, "total_tokens": 9234688}
{"current_steps": 300, "total_steps": 2341, "loss": 0.7616, "learning_rate": 4.800117169425223e-05, "epoch": 0.12812299807815503, "percentage": 12.82, "elapsed_time": "2:18:56", "remaining_time": "15:45:13", "throughput": 1128.88, "total_tokens": 9410528}
{"current_steps": 305, "total_steps": 2341, "loss": 0.7982, "learning_rate": 4.79349291634924e-05, "epoch": 0.1302583813794576, "percentage": 13.03, "elapsed_time": "2:21:35", "remaining_time": "15:45:13", "throughput": 1129.18, "total_tokens": 9593280}
{"current_steps": 310, "total_steps": 2341, "loss": 0.7515, "learning_rate": 4.786765403135444e-05, "epoch": 0.1323937646807602, "percentage": 13.24, "elapsed_time": "2:24:10", "remaining_time": "15:44:34", "throughput": 1129.4, "total_tokens": 9769824}
{"current_steps": 315, "total_steps": 2341, "loss": 0.6677, "learning_rate": 4.779934932677265e-05, "epoch": 0.13452914798206278, "percentage": 13.46, "elapsed_time": "2:26:27", "remaining_time": "15:42:00", "throughput": 1129.02, "total_tokens": 9921536}
{"current_steps": 320, "total_steps": 2341, "loss": 0.7559, "learning_rate": 4.77300181250359e-05, "epoch": 0.13666453128336536, "percentage": 13.67, "elapsed_time": "2:28:53", "remaining_time": "15:40:23", "throughput": 1129.3, "total_tokens": 10089088}
{"current_steps": 325, "total_steps": 2341, "loss": 0.7337, "learning_rate": 4.7659663547649124e-05, "epoch": 0.13879991458466795, "percentage": 13.88, "elapsed_time": "2:31:41", "remaining_time": "15:40:54", "throughput": 1129.79, "total_tokens": 10282272}
{"current_steps": 330, "total_steps": 2341, "loss": 0.8009, "learning_rate": 4.758828876219278e-05, "epoch": 0.14093529788597053, "percentage": 14.1, "elapsed_time": "2:34:09", "remaining_time": "15:39:23", "throughput": 1129.93, "total_tokens": 10450848}
{"current_steps": 335, "total_steps": 2341, "loss": 0.7203, "learning_rate": 4.751589698218026e-05, "epoch": 0.14307068118727312, "percentage": 14.31, "elapsed_time": "2:36:36", "remaining_time": "15:37:47", "throughput": 1129.95, "total_tokens": 10617664}
{"current_steps": 340, "total_steps": 2341, "loss": 0.5286, "learning_rate": 4.744249146691317e-05, "epoch": 0.1452060644885757, "percentage": 14.52, "elapsed_time": "2:39:14", "remaining_time": "15:37:08", "throughput": 1129.87, "total_tokens": 10794880}
{"current_steps": 345, "total_steps": 2341, "loss": 0.6662, "learning_rate": 4.736807552133464e-05, "epoch": 0.1473414477898783, "percentage": 14.74, "elapsed_time": "2:41:38", "remaining_time": "15:35:09", "throughput": 1129.79, "total_tokens": 10956960}
{"current_steps": 350, "total_steps": 2341, "loss": 0.6554, "learning_rate": 4.729265249588046e-05, "epoch": 0.14947683109118087, "percentage": 14.95, "elapsed_time": "2:43:50", "remaining_time": "15:32:01", "throughput": 1129.69, "total_tokens": 11105440}
{"current_steps": 355, "total_steps": 2341, "loss": 0.7981, "learning_rate": 4.721622578632832e-05, "epoch": 0.15161221439248346, "percentage": 15.16, "elapsed_time": "2:45:58", "remaining_time": "15:28:32", "throughput": 1129.51, "total_tokens": 11248448}
{"current_steps": 360, "total_steps": 2341, "loss": 0.5976, "learning_rate": 4.71387988336448e-05, "epoch": 0.15374759769378604, "percentage": 15.38, "elapsed_time": "2:48:17", "remaining_time": "15:26:07", "throughput": 1129.43, "total_tokens": 11404928}
{"current_steps": 365, "total_steps": 2341, "loss": 0.7783, "learning_rate": 4.706037512383058e-05, "epoch": 0.15588298099508863, "percentage": 15.59, "elapsed_time": "2:50:56", "remaining_time": "15:25:25", "throughput": 1129.72, "total_tokens": 11586880}
{"current_steps": 370, "total_steps": 2341, "loss": 0.6556, "learning_rate": 4.6980958187763394e-05, "epoch": 0.1580183642963912, "percentage": 15.81, "elapsed_time": "2:53:15", "remaining_time": "15:22:55", "throughput": 1129.98, "total_tokens": 11746368}
{"current_steps": 375, "total_steps": 2341, "loss": 0.5951, "learning_rate": 4.690055160103908e-05, "epoch": 0.1601537475976938, "percentage": 16.02, "elapsed_time": "2:55:12", "remaining_time": "15:18:34", "throughput": 1129.78, "total_tokens": 11876928}
{"current_steps": 380, "total_steps": 2341, "loss": 0.7438, "learning_rate": 4.681915898381064e-05, "epoch": 0.16228913089899638, "percentage": 16.23, "elapsed_time": "2:58:02", "remaining_time": "15:18:48", "throughput": 1129.92, "total_tokens": 12070656}
{"current_steps": 385, "total_steps": 2341, "loss": 0.861, "learning_rate": 4.67367840006252e-05, "epoch": 0.16442451420029897, "percentage": 16.45, "elapsed_time": "3:00:12", "remaining_time": "15:15:32", "throughput": 1129.74, "total_tokens": 12215104}
{"current_steps": 390, "total_steps": 2341, "loss": 0.597, "learning_rate": 4.6653430360259015e-05, "epoch": 0.16655989750160155, "percentage": 16.66, "elapsed_time": "3:02:27", "remaining_time": "15:12:46", "throughput": 1129.7, "total_tokens": 12367616}
{"current_steps": 395, "total_steps": 2341, "loss": 0.6786, "learning_rate": 4.656910181555055e-05, "epoch": 0.16869528080290414, "percentage": 16.87, "elapsed_time": "3:05:06", "remaining_time": "15:11:57", "throughput": 1129.99, "total_tokens": 12550368}
{"current_steps": 400, "total_steps": 2341, "loss": 0.6539, "learning_rate": 4.648380216323145e-05, "epoch": 0.1708306641042067, "percentage": 17.09, "elapsed_time": "3:07:15", "remaining_time": "15:08:39", "throughput": 1129.77, "total_tokens": 12693248}
{"current_steps": 405, "total_steps": 2341, "loss": 0.8733, "learning_rate": 4.639753524375564e-05, "epoch": 0.17296604740550928, "percentage": 17.3, "elapsed_time": "3:09:41", "remaining_time": "15:06:44", "throughput": 1129.66, "total_tokens": 12856832}
{"current_steps": 410, "total_steps": 2341, "loss": 0.636, "learning_rate": 4.631030494112638e-05, "epoch": 0.17510143070681186, "percentage": 17.51, "elapsed_time": "3:12:10", "remaining_time": "15:05:08", "throughput": 1129.85, "total_tokens": 13028352}
{"current_steps": 415, "total_steps": 2341, "loss": 0.7299, "learning_rate": 4.622211518272144e-05, "epoch": 0.17723681400811445, "percentage": 17.73, "elapsed_time": "3:14:10", "remaining_time": "15:01:10", "throughput": 1129.85, "total_tokens": 13163616}
{"current_steps": 420, "total_steps": 2341, "loss": 0.5954, "learning_rate": 4.613296993911623e-05, "epoch": 0.17937219730941703, "percentage": 17.94, "elapsed_time": "3:16:42", "remaining_time": "14:59:40", "throughput": 1130.01, "total_tokens": 13336608}
{"current_steps": 425, "total_steps": 2341, "loss": 0.8243, "learning_rate": 4.604287322390509e-05, "epoch": 0.18150758061071962, "percentage": 18.15, "elapsed_time": "3:19:08", "remaining_time": "14:57:47", "throughput": 1130.28, "total_tokens": 13505408}
{"current_steps": 430, "total_steps": 2341, "loss": 0.5552, "learning_rate": 4.59518290935205e-05, "epoch": 0.1836429639120222, "percentage": 18.37, "elapsed_time": "3:21:12", "remaining_time": "14:54:11", "throughput": 1130.08, "total_tokens": 13642592}
{"current_steps": 435, "total_steps": 2341, "loss": 0.6857, "learning_rate": 4.5859841647050565e-05, "epoch": 0.18577834721332478, "percentage": 18.58, "elapsed_time": "3:23:24", "remaining_time": "14:51:16", "throughput": 1129.96, "total_tokens": 13790976}
{"current_steps": 440, "total_steps": 2341, "loss": 0.6743, "learning_rate": 4.576691502605434e-05, "epoch": 0.18791373051462737, "percentage": 18.8, "elapsed_time": "3:25:49", "remaining_time": "14:49:16", "throughput": 1130.08, "total_tokens": 13956224}
{"current_steps": 445, "total_steps": 2341, "loss": 0.579, "learning_rate": 4.5673053414375436e-05, "epoch": 0.19004911381592995, "percentage": 19.01, "elapsed_time": "3:28:12", "remaining_time": "14:47:05", "throughput": 1129.92, "total_tokens": 14115296}
{"current_steps": 450, "total_steps": 2341, "loss": 0.8965, "learning_rate": 4.557826103795364e-05, "epoch": 0.19218449711723254, "percentage": 19.22, "elapsed_time": "3:30:25", "remaining_time": "14:44:14", "throughput": 1130.04, "total_tokens": 14267168}
{"current_steps": 455, "total_steps": 2341, "loss": 0.8137, "learning_rate": 4.548254216463465e-05, "epoch": 0.19431988041853512, "percentage": 19.44, "elapsed_time": "3:32:33", "remaining_time": "14:41:05", "throughput": 1130.11, "total_tokens": 14413312}
{"current_steps": 460, "total_steps": 2341, "loss": 0.617, "learning_rate": 4.538590110397789e-05, "epoch": 0.1964552637198377, "percentage": 19.65, "elapsed_time": "3:34:37", "remaining_time": "14:37:39", "throughput": 1129.91, "total_tokens": 14550880}
{"current_steps": 465, "total_steps": 2341, "loss": 0.9175, "learning_rate": 4.528834220706253e-05, "epoch": 0.1985906470211403, "percentage": 19.86, "elapsed_time": "3:36:42", "remaining_time": "14:34:15", "throughput": 1129.95, "total_tokens": 14691712}
{"current_steps": 470, "total_steps": 2341, "loss": 0.7633, "learning_rate": 4.518986986629157e-05, "epoch": 0.20072603032244288, "percentage": 20.08, "elapsed_time": "3:39:10", "remaining_time": "14:32:29", "throughput": 1130.12, "total_tokens": 14861408}
{"current_steps": 475, "total_steps": 2341, "loss": 0.6935, "learning_rate": 4.509048851519404e-05, "epoch": 0.20286141362374546, "percentage": 20.29, "elapsed_time": "3:41:18", "remaining_time": "14:29:22", "throughput": 1129.92, "total_tokens": 15003328}
{"current_steps": 480, "total_steps": 2341, "loss": 0.6322, "learning_rate": 4.499020262822547e-05, "epoch": 0.20499679692504805, "percentage": 20.5, "elapsed_time": "3:43:08", "remaining_time": "14:25:09", "throughput": 1129.74, "total_tokens": 15125792}
{"current_steps": 485, "total_steps": 2341, "loss": 0.9118, "learning_rate": 4.4889016720566355e-05, "epoch": 0.20713218022635063, "percentage": 20.72, "elapsed_time": "3:45:42", "remaining_time": "14:23:43", "throughput": 1129.93, "total_tokens": 15301856}
{"current_steps": 490, "total_steps": 2341, "loss": 0.6331, "learning_rate": 4.478693534791893e-05, "epoch": 0.20926756352765322, "percentage": 20.93, "elapsed_time": "3:48:25", "remaining_time": "14:22:51", "throughput": 1130.05, "total_tokens": 15487488}
{"current_steps": 495, "total_steps": 2341, "loss": 0.7326, "learning_rate": 4.4683963106302e-05, "epoch": 0.2114029468289558, "percentage": 21.14, "elapsed_time": "3:50:53", "remaining_time": "14:21:04", "throughput": 1130.2, "total_tokens": 15657312}
{"current_steps": 500, "total_steps": 2341, "loss": 0.6806, "learning_rate": 4.458010463184405e-05, "epoch": 0.21353833013025839, "percentage": 21.36, "elapsed_time": "3:53:40", "remaining_time": "14:20:25", "throughput": 1130.52, "total_tokens": 15850912}
{"current_steps": 505, "total_steps": 2341, "loss": 0.7017, "learning_rate": 4.4475364600574535e-05, "epoch": 0.21567371343156097, "percentage": 21.57, "elapsed_time": "3:55:42", "remaining_time": "14:16:56", "throughput": 1130.39, "total_tokens": 15986400}
{"current_steps": 510, "total_steps": 2341, "loss": 0.6438, "learning_rate": 4.43697477282133e-05, "epoch": 0.21780909673286356, "percentage": 21.79, "elapsed_time": "3:58:01", "remaining_time": "14:14:35", "throughput": 1130.44, "total_tokens": 16144960}
{"current_steps": 515, "total_steps": 2341, "loss": 0.757, "learning_rate": 4.4263258769958274e-05, "epoch": 0.21994448003416614, "percentage": 22.0, "elapsed_time": "4:00:11", "remaining_time": "14:11:38", "throughput": 1130.33, "total_tokens": 16289856}
{"current_steps": 520, "total_steps": 2341, "loss": 0.6478, "learning_rate": 4.415590252027141e-05, "epoch": 0.22207986333546872, "percentage": 22.21, "elapsed_time": "4:02:25", "remaining_time": "14:08:56", "throughput": 1130.21, "total_tokens": 16439328}
{"current_steps": 525, "total_steps": 2341, "loss": 0.7572, "learning_rate": 4.404768381266279e-05, "epoch": 0.2242152466367713, "percentage": 22.43, "elapsed_time": "4:04:26", "remaining_time": "14:05:32", "throughput": 1130.15, "total_tokens": 16575552}
{"current_steps": 530, "total_steps": 2341, "loss": 0.7073, "learning_rate": 4.393860751947302e-05, "epoch": 0.2263506299380739, "percentage": 22.64, "elapsed_time": "4:07:01", "remaining_time": "14:04:05", "throughput": 1130.36, "total_tokens": 16754016}
{"current_steps": 535, "total_steps": 2341, "loss": 0.6275, "learning_rate": 4.382867855165386e-05, "epoch": 0.22848601323937648, "percentage": 22.85, "elapsed_time": "4:09:09", "remaining_time": "14:01:05", "throughput": 1130.28, "total_tokens": 16897248}
{"current_steps": 540, "total_steps": 2341, "loss": 0.6937, "learning_rate": 4.371790185854709e-05, "epoch": 0.23062139654067906, "percentage": 23.07, "elapsed_time": "4:11:46", "remaining_time": "13:59:41", "throughput": 1130.52, "total_tokens": 17077792}
{"current_steps": 545, "total_steps": 2341, "loss": 0.7242, "learning_rate": 4.360628242766175e-05, "epoch": 0.23275677984198165, "percentage": 23.28, "elapsed_time": "4:14:03", "remaining_time": "13:57:13", "throughput": 1130.49, "total_tokens": 17232480}
{"current_steps": 550, "total_steps": 2341, "loss": 0.6462, "learning_rate": 4.3493825284449515e-05, "epoch": 0.23489216314328423, "percentage": 23.49, "elapsed_time": "4:16:06", "remaining_time": "13:53:59", "throughput": 1130.43, "total_tokens": 17371008}
{"current_steps": 555, "total_steps": 2341, "loss": 0.6891, "learning_rate": 4.338053549207844e-05, "epoch": 0.2370275464445868, "percentage": 23.71, "elapsed_time": "4:18:03", "remaining_time": "13:50:26", "throughput": 1130.37, "total_tokens": 17502016}
{"current_steps": 560, "total_steps": 2341, "loss": 0.6293, "learning_rate": 4.326641815120505e-05, "epoch": 0.23916292974588937, "percentage": 23.92, "elapsed_time": "4:20:24", "remaining_time": "13:48:11", "throughput": 1130.38, "total_tokens": 17661632}
{"current_steps": 565, "total_steps": 2341, "loss": 0.7189, "learning_rate": 4.315147839974464e-05, "epoch": 0.24129831304719196, "percentage": 24.13, "elapsed_time": "4:22:13", "remaining_time": "13:44:16", "throughput": 1130.17, "total_tokens": 17781440}
{"current_steps": 570, "total_steps": 2341, "loss": 0.6933, "learning_rate": 4.303572141263997e-05, "epoch": 0.24343369634849454, "percentage": 24.35, "elapsed_time": "4:25:09", "remaining_time": "13:43:51", "throughput": 1130.37, "total_tokens": 17983840}
{"current_steps": 575, "total_steps": 2341, "loss": 0.6973, "learning_rate": 4.2919152401628284e-05, "epoch": 0.24556907964979713, "percentage": 24.56, "elapsed_time": "4:27:50", "remaining_time": "13:42:36", "throughput": 1130.46, "total_tokens": 18166592}
{"current_steps": 580, "total_steps": 2341, "loss": 0.5742, "learning_rate": 4.2801776615006644e-05, "epoch": 0.2477044629510997, "percentage": 24.78, "elapsed_time": "4:29:53", "remaining_time": "13:39:25", "throughput": 1130.29, "total_tokens": 18302912}
{"current_steps": 585, "total_steps": 2341, "loss": 0.6087, "learning_rate": 4.2683599337395655e-05, "epoch": 0.2498398462524023, "percentage": 24.99, "elapsed_time": "4:32:19", "remaining_time": "13:37:26", "throughput": 1130.34, "total_tokens": 18469344}
{"current_steps": 590, "total_steps": 2341, "loss": 0.6595, "learning_rate": 4.2564625889501496e-05, "epoch": 0.2519752295537049, "percentage": 25.2, "elapsed_time": "4:34:17", "remaining_time": "13:34:01", "throughput": 1130.15, "total_tokens": 18599104}
{"current_steps": 595, "total_steps": 2341, "loss": 0.7353, "learning_rate": 4.2444861627876444e-05, "epoch": 0.25411061285500747, "percentage": 25.42, "elapsed_time": "4:36:57", "remaining_time": "13:32:43", "throughput": 1130.47, "total_tokens": 18785696}
{"current_steps": 600, "total_steps": 2341, "loss": 0.8322, "learning_rate": 4.2324311944677585e-05, "epoch": 0.25624599615631005, "percentage": 25.63, "elapsed_time": "4:39:38", "remaining_time": "13:31:25", "throughput": 1130.76, "total_tokens": 18972224}
{"current_steps": 605, "total_steps": 2341, "loss": 0.6534, "learning_rate": 4.220298226742415e-05, "epoch": 0.25838137945761264, "percentage": 25.84, "elapsed_time": "4:41:39", "remaining_time": "13:28:13", "throughput": 1130.65, "total_tokens": 19107968}
{"current_steps": 610, "total_steps": 2341, "loss": 0.7441, "learning_rate": 4.208087805875314e-05, "epoch": 0.2605167627589152, "percentage": 26.06, "elapsed_time": "4:44:22", "remaining_time": "13:26:57", "throughput": 1130.87, "total_tokens": 19295072}
{"current_steps": 615, "total_steps": 2341, "loss": 0.816, "learning_rate": 4.195800481617328e-05, "epoch": 0.2626521460602178, "percentage": 26.27, "elapsed_time": "4:46:31", "remaining_time": "13:24:07", "throughput": 1130.82, "total_tokens": 19440384}
{"current_steps": 620, "total_steps": 2341, "loss": 0.7341, "learning_rate": 4.183436807181765e-05, "epoch": 0.2647875293615204, "percentage": 26.48, "elapsed_time": "4:49:09", "remaining_time": "13:22:38", "throughput": 1130.85, "total_tokens": 19619680}
{"current_steps": 625, "total_steps": 2341, "loss": 0.6835, "learning_rate": 4.17099733921945e-05, "epoch": 0.266922912662823, "percentage": 26.7, "elapsed_time": "4:51:14", "remaining_time": "13:19:38", "throughput": 1130.73, "total_tokens": 19759200}
{"current_steps": 630, "total_steps": 2341, "loss": 0.7359, "learning_rate": 4.158482637793667e-05, "epoch": 0.26905829596412556, "percentage": 26.91, "elapsed_time": "4:53:38", "remaining_time": "13:17:30", "throughput": 1130.86, "total_tokens": 19924448}
{"current_steps": 635, "total_steps": 2341, "loss": 0.6531, "learning_rate": 4.145893266354944e-05, "epoch": 0.27119367926542814, "percentage": 27.13, "elapsed_time": "4:55:55", "remaining_time": "13:15:03", "throughput": 1130.77, "total_tokens": 20077888}
{"current_steps": 640, "total_steps": 2341, "loss": 0.5728, "learning_rate": 4.133229791715685e-05, "epoch": 0.27332906256673073, "percentage": 27.34, "elapsed_time": "4:58:05", "remaining_time": "13:12:17", "throughput": 1130.69, "total_tokens": 20223296}
{"current_steps": 645, "total_steps": 2341, "loss": 0.7355, "learning_rate": 4.1204927840246455e-05, "epoch": 0.2754644458680333, "percentage": 27.55, "elapsed_time": "5:00:01", "remaining_time": "13:08:54", "throughput": 1130.62, "total_tokens": 20352928}
{"current_steps": 650, "total_steps": 2341, "loss": 0.6645, "learning_rate": 4.1076828167412683e-05, "epoch": 0.2775998291693359, "percentage": 27.77, "elapsed_time": "5:02:21", "remaining_time": "13:06:35", "throughput": 1130.64, "total_tokens": 20511232}
{"current_steps": 655, "total_steps": 2341, "loss": 0.5866, "learning_rate": 4.0948004666098625e-05, "epoch": 0.2797352124706385, "percentage": 27.98, "elapsed_time": "5:04:51", "remaining_time": "13:04:44", "throughput": 1130.77, "total_tokens": 20684032}
{"current_steps": 660, "total_steps": 2341, "loss": 0.6235, "learning_rate": 4.081846313633637e-05, "epoch": 0.28187059577194107, "percentage": 28.19, "elapsed_time": "5:06:59", "remaining_time": "13:01:54", "throughput": 1130.64, "total_tokens": 20826176}
{"current_steps": 665, "total_steps": 2341, "loss": 0.6974, "learning_rate": 4.068820941048587e-05, "epoch": 0.28400597907324365, "percentage": 28.41, "elapsed_time": "5:09:38", "remaining_time": "13:00:24", "throughput": 1130.71, "total_tokens": 21007264}
{"current_steps": 670, "total_steps": 2341, "loss": 0.6629, "learning_rate": 4.0557249352972316e-05, "epoch": 0.28614136237454624, "percentage": 28.62, "elapsed_time": "5:11:43", "remaining_time": "12:57:27", "throughput": 1130.52, "total_tokens": 21145024}
{"current_steps": 675, "total_steps": 2341, "loss": 0.7321, "learning_rate": 4.0425588860022166e-05, "epoch": 0.2882767456758488, "percentage": 28.83, "elapsed_time": "5:13:56", "remaining_time": "12:54:50", "throughput": 1130.54, "total_tokens": 21295104}
{"current_steps": 680, "total_steps": 2341, "loss": 0.6325, "learning_rate": 4.029323385939763e-05, "epoch": 0.2904121289771514, "percentage": 29.05, "elapsed_time": "5:16:05", "remaining_time": "12:52:05", "throughput": 1130.5, "total_tokens": 21440256}
{"current_steps": 685, "total_steps": 2341, "loss": 0.6882, "learning_rate": 4.0160190310129806e-05, "epoch": 0.292547512278454, "percentage": 29.26, "elapsed_time": "5:18:20", "remaining_time": "12:49:36", "throughput": 1130.48, "total_tokens": 21592768}
{"current_steps": 690, "total_steps": 2341, "loss": 0.659, "learning_rate": 4.0026464202250375e-05, "epoch": 0.2946828955797566, "percentage": 29.47, "elapsed_time": "5:20:50", "remaining_time": "12:47:41", "throughput": 1130.55, "total_tokens": 21763360}
{"current_steps": 695, "total_steps": 2341, "loss": 0.6757, "learning_rate": 3.989206155652192e-05, "epoch": 0.29681827888105916, "percentage": 29.69, "elapsed_time": "5:23:05", "remaining_time": "12:45:12", "throughput": 1130.6, "total_tokens": 21917792}
{"current_steps": 700, "total_steps": 2341, "loss": 0.6238, "learning_rate": 3.975698842416684e-05, "epoch": 0.29895366218236175, "percentage": 29.9, "elapsed_time": "5:25:07", "remaining_time": "12:42:11", "throughput": 1130.44, "total_tokens": 22052384}
{"current_steps": 705, "total_steps": 2341, "loss": 0.688, "learning_rate": 3.962125088659492e-05, "epoch": 0.30108904548366433, "percentage": 30.12, "elapsed_time": "5:27:41", "remaining_time": "12:40:25", "throughput": 1130.42, "total_tokens": 22225568}
{"current_steps": 710, "total_steps": 2341, "loss": 0.7123, "learning_rate": 3.948485505512953e-05, "epoch": 0.3032244287849669, "percentage": 30.33, "elapsed_time": "5:30:04", "remaining_time": "12:38:13", "throughput": 1130.48, "total_tokens": 22388160}
{"current_steps": 715, "total_steps": 2341, "loss": 0.6638, "learning_rate": 3.9347807070732444e-05, "epoch": 0.3053598120862695, "percentage": 30.54, "elapsed_time": "5:32:50", "remaining_time": "12:36:56", "throughput": 1130.64, "total_tokens": 22579936}
{"current_steps": 720, "total_steps": 2341, "loss": 0.7064, "learning_rate": 3.921011310372739e-05, "epoch": 0.3074951953875721, "percentage": 30.76, "elapsed_time": "5:35:03", "remaining_time": "12:34:20", "throughput": 1130.66, "total_tokens": 22730048}
{"current_steps": 725, "total_steps": 2341, "loss": 0.5651, "learning_rate": 3.907177935352223e-05, "epoch": 0.30963057868887467, "percentage": 30.97, "elapsed_time": "5:37:41", "remaining_time": "12:32:42", "throughput": 1130.77, "total_tokens": 22911168}
{"current_steps": 730, "total_steps": 2341, "loss": 0.6695, "learning_rate": 3.893281204832984e-05, "epoch": 0.31176596199017725, "percentage": 31.18, "elapsed_time": "5:40:17", "remaining_time": "12:30:58", "throughput": 1130.79, "total_tokens": 23088096}
{"current_steps": 735, "total_steps": 2341, "loss": 0.5989, "learning_rate": 3.87932174448877e-05, "epoch": 0.31390134529147984, "percentage": 31.4, "elapsed_time": "5:42:37", "remaining_time": "12:28:38", "throughput": 1130.66, "total_tokens": 23243616}
{"current_steps": 740, "total_steps": 2341, "loss": 0.5707, "learning_rate": 3.8653001828176185e-05, "epoch": 0.3160367285927824, "percentage": 31.61, "elapsed_time": "5:44:59", "remaining_time": "12:26:23", "throughput": 1130.58, "total_tokens": 23402240}
{"current_steps": 745, "total_steps": 2341, "loss": 0.6727, "learning_rate": 3.8512171511135616e-05, "epoch": 0.318172111894085, "percentage": 31.82, "elapsed_time": "5:47:26", "remaining_time": "12:24:18", "throughput": 1130.56, "total_tokens": 23568096}
{"current_steps": 750, "total_steps": 2341, "loss": 0.7122, "learning_rate": 3.8370732834382025e-05, "epoch": 0.3203074951953876, "percentage": 32.04, "elapsed_time": "5:49:43", "remaining_time": "12:21:53", "throughput": 1130.59, "total_tokens": 23723968}
{"current_steps": 755, "total_steps": 2341, "loss": 0.6667, "learning_rate": 3.822869216592167e-05, "epoch": 0.3224428784966902, "percentage": 32.25, "elapsed_time": "5:52:03", "remaining_time": "12:19:33", "throughput": 1130.59, "total_tokens": 23882016}
{"current_steps": 760, "total_steps": 2341, "loss": 0.7896, "learning_rate": 3.8086055900864356e-05, "epoch": 0.32457826179799276, "percentage": 32.46, "elapsed_time": "5:54:20", "remaining_time": "12:17:06", "throughput": 1130.62, "total_tokens": 24037088}
{"current_steps": 765, "total_steps": 2341, "loss": 0.6208, "learning_rate": 3.794283046113546e-05, "epoch": 0.32671364509929535, "percentage": 32.68, "elapsed_time": "5:56:29", "remaining_time": "12:14:25", "throughput": 1130.45, "total_tokens": 24180032}
{"current_steps": 770, "total_steps": 2341, "loss": 0.6193, "learning_rate": 3.7799022295186823e-05, "epoch": 0.32884902840059793, "percentage": 32.89, "elapsed_time": "5:59:13", "remaining_time": "12:12:53", "throughput": 1130.38, "total_tokens": 24363168}
{"current_steps": 775, "total_steps": 2341, "loss": 0.6024, "learning_rate": 3.765463787770645e-05, "epoch": 0.3309844117019005, "percentage": 33.11, "elapsed_time": "6:01:35", "remaining_time": "12:10:39", "throughput": 1130.27, "total_tokens": 24522112}
{"current_steps": 780, "total_steps": 2341, "loss": 0.7026, "learning_rate": 3.750968370932694e-05, "epoch": 0.3331197950032031, "percentage": 33.32, "elapsed_time": "6:04:06", "remaining_time": "12:08:41", "throughput": 1130.33, "total_tokens": 24694048}
{"current_steps": 785, "total_steps": 2341, "loss": 0.6094, "learning_rate": 3.736416631633286e-05, "epoch": 0.3352551783045057, "percentage": 33.53, "elapsed_time": "6:06:21", "remaining_time": "12:06:11", "throughput": 1130.37, "total_tokens": 24847616}
{"current_steps": 790, "total_steps": 2341, "loss": 0.6167, "learning_rate": 3.721809225036688e-05, "epoch": 0.33739056160580827, "percentage": 33.75, "elapsed_time": "6:08:31", "remaining_time": "12:03:30", "throughput": 1130.3, "total_tokens": 24992096}
{"current_steps": 795, "total_steps": 2341, "loss": 0.6861, "learning_rate": 3.7071468088134806e-05, "epoch": 0.3395259449071108, "percentage": 33.96, "elapsed_time": "6:10:48", "remaining_time": "12:01:05", "throughput": 1130.23, "total_tokens": 25145792}
{"current_steps": 800, "total_steps": 2341, "loss": 0.8109, "learning_rate": 3.692430043110947e-05, "epoch": 0.3416613282084134, "percentage": 34.17, "elapsed_time": "6:13:16", "remaining_time": "11:59:01", "throughput": 1130.39, "total_tokens": 25316896}
{"current_steps": 805, "total_steps": 2341, "loss": 0.6796, "learning_rate": 3.677659590523354e-05, "epoch": 0.34379671150971597, "percentage": 34.39, "elapsed_time": "6:15:18", "remaining_time": "11:56:07", "throughput": 1130.29, "total_tokens": 25452608}
{"current_steps": 810, "total_steps": 2341, "loss": 0.8018, "learning_rate": 3.662836116062117e-05, "epoch": 0.34593209481101855, "percentage": 34.6, "elapsed_time": "6:17:27", "remaining_time": "11:53:26", "throughput": 1130.25, "total_tokens": 25597056}
{"current_steps": 815, "total_steps": 2341, "loss": 0.7318, "learning_rate": 3.647960287125859e-05, "epoch": 0.34806747811232114, "percentage": 34.81, "elapsed_time": "6:19:53", "remaining_time": "11:51:18", "throughput": 1130.32, "total_tokens": 25764224}
{"current_steps": 820, "total_steps": 2341, "loss": 0.6615, "learning_rate": 3.6330327734703626e-05, "epoch": 0.3502028614136237, "percentage": 35.03, "elapsed_time": "6:21:49", "remaining_time": "11:48:14", "throughput": 1130.26, "total_tokens": 25893824}
{"current_steps": 825, "total_steps": 2341, "loss": 0.6466, "learning_rate": 3.61805424717842e-05, "epoch": 0.3523382447149263, "percentage": 35.24, "elapsed_time": "6:23:54", "remaining_time": "11:45:28", "throughput": 1130.21, "total_tokens": 26034304}
{"current_steps": 830, "total_steps": 2341, "loss": 0.7432, "learning_rate": 3.603025382629565e-05, "epoch": 0.3544736280162289, "percentage": 35.45, "elapsed_time": "6:26:10", "remaining_time": "11:43:01", "throughput": 1130.22, "total_tokens": 26187712}
{"current_steps": 835, "total_steps": 2341, "loss": 0.6275, "learning_rate": 3.58794685646972e-05, "epoch": 0.3566090113175315, "percentage": 35.67, "elapsed_time": "6:28:23", "remaining_time": "11:40:30", "throughput": 1130.2, "total_tokens": 26338080}
{"current_steps": 840, "total_steps": 2341, "loss": 0.6545, "learning_rate": 3.572819347580722e-05, "epoch": 0.35874439461883406, "percentage": 35.88, "elapsed_time": "6:30:48", "remaining_time": "11:38:20", "throughput": 1130.19, "total_tokens": 26501440}
{"current_steps": 845, "total_steps": 2341, "loss": 0.6806, "learning_rate": 3.5576435370497655e-05, "epoch": 0.36087977792013665, "percentage": 36.1, "elapsed_time": "6:33:12", "remaining_time": "11:36:08", "throughput": 1130.19, "total_tokens": 26663936}
{"current_steps": 850, "total_steps": 2341, "loss": 0.6517, "learning_rate": 3.542420108138732e-05, "epoch": 0.36301516122143923, "percentage": 36.31, "elapsed_time": "6:35:42", "remaining_time": "11:34:06", "throughput": 1130.24, "total_tokens": 26834176}
{"current_steps": 855, "total_steps": 2341, "loss": 0.7356, "learning_rate": 3.527149746253431e-05, "epoch": 0.3651505445227418, "percentage": 36.52, "elapsed_time": "6:38:06", "remaining_time": "11:31:54", "throughput": 1130.23, "total_tokens": 26996928}
{"current_steps": 860, "total_steps": 2341, "loss": 0.8021, "learning_rate": 3.511833138912738e-05, "epoch": 0.3672859278240444, "percentage": 36.74, "elapsed_time": "6:40:33", "remaining_time": "11:29:47", "throughput": 1130.2, "total_tokens": 27162304}
{"current_steps": 865, "total_steps": 2341, "loss": 0.7542, "learning_rate": 3.496470975717643e-05, "epoch": 0.369421311125347, "percentage": 36.95, "elapsed_time": "6:42:52", "remaining_time": "11:27:26", "throughput": 1130.2, "total_tokens": 27319392}
{"current_steps": 870, "total_steps": 2341, "loss": 0.6407, "learning_rate": 3.4810639483202015e-05, "epoch": 0.37155669442664957, "percentage": 37.16, "elapsed_time": "6:45:38", "remaining_time": "11:25:51", "throughput": 1130.38, "total_tokens": 27511360}
{"current_steps": 875, "total_steps": 2341, "loss": 0.7553, "learning_rate": 3.465612750392393e-05, "epoch": 0.37369207772795215, "percentage": 37.38, "elapsed_time": "6:48:24", "remaining_time": "11:24:15", "throughput": 1130.55, "total_tokens": 27703488}
{"current_steps": 880, "total_steps": 2341, "loss": 0.6873, "learning_rate": 3.450118077594891e-05, "epoch": 0.37582746102925474, "percentage": 37.59, "elapsed_time": "6:50:47", "remaining_time": "11:22:00", "throughput": 1130.62, "total_tokens": 27866880}
{"current_steps": 885, "total_steps": 2341, "loss": 0.6827, "learning_rate": 3.434580627545743e-05, "epoch": 0.3779628443305573, "percentage": 37.8, "elapsed_time": "6:53:29", "remaining_time": "11:20:16", "throughput": 1130.7, "total_tokens": 28052480}
{"current_steps": 890, "total_steps": 2341, "loss": 0.6143, "learning_rate": 3.419001099788959e-05, "epoch": 0.3800982276318599, "percentage": 38.02, "elapsed_time": "6:56:03", "remaining_time": "11:18:19", "throughput": 1130.81, "total_tokens": 28229600}
{"current_steps": 895, "total_steps": 2341, "loss": 0.5969, "learning_rate": 3.403380195763018e-05, "epoch": 0.3822336109331625, "percentage": 38.23, "elapsed_time": "6:58:27", "remaining_time": "11:16:05", "throughput": 1130.84, "total_tokens": 28392992}
{"current_steps": 900, "total_steps": 2341, "loss": 0.4596, "learning_rate": 3.387718618769287e-05, "epoch": 0.3843689942344651, "percentage": 38.45, "elapsed_time": "7:01:02", "remaining_time": "11:14:08", "throughput": 1130.88, "total_tokens": 28569344}
{"current_steps": 905, "total_steps": 2341, "loss": 0.6412, "learning_rate": 3.372017073940355e-05, "epoch": 0.38650437753576766, "percentage": 38.66, "elapsed_time": "7:03:26", "remaining_time": "11:11:54", "throughput": 1130.9, "total_tokens": 28732608}
{"current_steps": 910, "total_steps": 2341, "loss": 0.7309, "learning_rate": 3.356276268208289e-05, "epoch": 0.38863976083707025, "percentage": 38.87, "elapsed_time": "7:05:41", "remaining_time": "11:09:24", "throughput": 1130.94, "total_tokens": 28885792}
{"current_steps": 915, "total_steps": 2341, "loss": 0.5964, "learning_rate": 3.340496910272798e-05, "epoch": 0.39077514413837283, "percentage": 39.09, "elapsed_time": "7:07:45", "remaining_time": "11:06:38", "throughput": 1130.84, "total_tokens": 29023008}
{"current_steps": 920, "total_steps": 2341, "loss": 0.6368, "learning_rate": 3.324679710569334e-05, "epoch": 0.3929105274396754, "percentage": 39.3, "elapsed_time": "7:09:53", "remaining_time": "11:04:00", "throughput": 1130.8, "total_tokens": 29167584}
{"current_steps": 925, "total_steps": 2341, "loss": 0.626, "learning_rate": 3.308825381237103e-05, "epoch": 0.395045910740978, "percentage": 39.51, "elapsed_time": "7:12:11", "remaining_time": "11:01:36", "throughput": 1130.78, "total_tokens": 29322720}
{"current_steps": 930, "total_steps": 2341, "loss": 0.8989, "learning_rate": 3.292934636086998e-05, "epoch": 0.3971812940422806, "percentage": 39.73, "elapsed_time": "7:14:34", "remaining_time": "10:59:20", "throughput": 1130.87, "total_tokens": 29487200}
{"current_steps": 935, "total_steps": 2341, "loss": 0.7116, "learning_rate": 3.2770081905694696e-05, "epoch": 0.39931667734358317, "percentage": 39.94, "elapsed_time": "7:16:59", "remaining_time": "10:57:07", "throughput": 1130.88, "total_tokens": 29651232}
{"current_steps": 940, "total_steps": 2341, "loss": 0.7665, "learning_rate": 3.261046761742305e-05, "epoch": 0.40145206064488576, "percentage": 40.15, "elapsed_time": "7:19:14", "remaining_time": "10:54:39", "throughput": 1130.95, "total_tokens": 29805216}
{"current_steps": 945, "total_steps": 2341, "loss": 0.6187, "learning_rate": 3.245051068238348e-05, "epoch": 0.40358744394618834, "percentage": 40.37, "elapsed_time": "7:21:36", "remaining_time": "10:52:21", "throughput": 1131.0, "total_tokens": 29967360}
{"current_steps": 950, "total_steps": 2341, "loss": 0.7386, "learning_rate": 3.229021830233149e-05, "epoch": 0.4057228272474909, "percentage": 40.58, "elapsed_time": "7:23:54", "remaining_time": "10:49:57", "throughput": 1131.0, "total_tokens": 30123104}
{"current_steps": 955, "total_steps": 2341, "loss": 0.7952, "learning_rate": 3.2129597694125296e-05, "epoch": 0.4078582105487935, "percentage": 40.79, "elapsed_time": "7:26:29", "remaining_time": "10:48:00", "throughput": 1131.1, "total_tokens": 30302240}
{"current_steps": 960, "total_steps": 2341, "loss": 0.6779, "learning_rate": 3.1968656089401e-05, "epoch": 0.4099935938500961, "percentage": 41.01, "elapsed_time": "7:28:37", "remaining_time": "10:45:22", "throughput": 1131.05, "total_tokens": 30445184}
{"current_steps": 965, "total_steps": 2341, "loss": 0.5771, "learning_rate": 3.180740073424693e-05, "epoch": 0.4121289771513987, "percentage": 41.22, "elapsed_time": "7:30:52", "remaining_time": "10:42:54", "throughput": 1130.99, "total_tokens": 30596384}
{"current_steps": 970, "total_steps": 2341, "loss": 0.6306, "learning_rate": 3.164583888887746e-05, "epoch": 0.41426436045270126, "percentage": 41.44, "elapsed_time": "7:33:32", "remaining_time": "10:41:01", "throughput": 1131.06, "total_tokens": 30778592}
{"current_steps": 975, "total_steps": 2341, "loss": 0.693, "learning_rate": 3.1483977827306054e-05, "epoch": 0.41639974375400385, "percentage": 41.65, "elapsed_time": "7:35:56", "remaining_time": "10:38:47", "throughput": 1131.11, "total_tokens": 30943360}
{"current_steps": 980, "total_steps": 2341, "loss": 0.5558, "learning_rate": 3.1321824837017875e-05, "epoch": 0.41853512705530643, "percentage": 41.86, "elapsed_time": "7:37:45", "remaining_time": "10:35:43", "throughput": 1130.96, "total_tokens": 31062304}
{"current_steps": 985, "total_steps": 2341, "loss": 0.7323, "learning_rate": 3.1159387218641575e-05, "epoch": 0.420670510356609, "percentage": 42.08, "elapsed_time": "7:40:15", "remaining_time": "10:33:37", "throughput": 1131.02, "total_tokens": 31233792}
{"current_steps": 990, "total_steps": 2341, "loss": 0.6371, "learning_rate": 3.099667228562064e-05, "epoch": 0.4228058936579116, "percentage": 42.29, "elapsed_time": "7:42:29", "remaining_time": "10:31:08", "throughput": 1130.96, "total_tokens": 31383616}
{"current_steps": 995, "total_steps": 2341, "loss": 0.6631, "learning_rate": 3.083368736388414e-05, "epoch": 0.4249412769592142, "percentage": 42.5, "elapsed_time": "7:45:03", "remaining_time": "10:29:06", "throughput": 1131.04, "total_tokens": 31559968}
{"current_steps": 1000, "total_steps": 2341, "loss": 0.6021, "learning_rate": 3.067043979151687e-05, "epoch": 0.42707666026051677, "percentage": 42.72, "elapsed_time": "7:47:22", "remaining_time": "10:26:45", "throughput": 1131.01, "total_tokens": 31716480}
{"current_steps": 1005, "total_steps": 2341, "loss": 0.5901, "learning_rate": 3.0506936918428947e-05, "epoch": 0.42921204356181936, "percentage": 42.93, "elapsed_time": "7:49:31", "remaining_time": "10:24:09", "throughput": 1131.0, "total_tokens": 31861568}
{"current_steps": 1010, "total_steps": 2341, "loss": 0.5969, "learning_rate": 3.0343186106024946e-05, "epoch": 0.43134742686312194, "percentage": 43.14, "elapsed_time": "7:51:54", "remaining_time": "10:21:53", "throughput": 1130.98, "total_tokens": 32023008}
{"current_steps": 1015, "total_steps": 2341, "loss": 0.6469, "learning_rate": 3.01791947268724e-05, "epoch": 0.4334828101644245, "percentage": 43.36, "elapsed_time": "7:54:38", "remaining_time": "10:20:04", "throughput": 1131.15, "total_tokens": 32213024}
{"current_steps": 1020, "total_steps": 2341, "loss": 0.6257, "learning_rate": 3.0014970164369936e-05, "epoch": 0.4356181934657271, "percentage": 43.57, "elapsed_time": "7:57:07", "remaining_time": "10:17:55", "throughput": 1131.17, "total_tokens": 32382752}
{"current_steps": 1025, "total_steps": 2341, "loss": 0.7496, "learning_rate": 2.985051981241479e-05, "epoch": 0.4377535767670297, "percentage": 43.78, "elapsed_time": "7:59:11", "remaining_time": "10:15:14", "throughput": 1131.1, "total_tokens": 32520832}
{"current_steps": 1030, "total_steps": 2341, "loss": 0.8778, "learning_rate": 2.9685851075069954e-05, "epoch": 0.4398889600683323, "percentage": 44.0, "elapsed_time": "8:01:26", "remaining_time": "10:12:47", "throughput": 1131.1, "total_tokens": 32673472}
{"current_steps": 1035, "total_steps": 2341, "loss": 0.7424, "learning_rate": 2.9520971366230783e-05, "epoch": 0.44202434336963486, "percentage": 44.21, "elapsed_time": "8:04:00", "remaining_time": "10:10:44", "throughput": 1131.19, "total_tokens": 32850272}
{"current_steps": 1040, "total_steps": 2341, "loss": 0.8948, "learning_rate": 2.9355888109291247e-05, "epoch": 0.44415972667093745, "percentage": 44.43, "elapsed_time": "8:06:09", "remaining_time": "10:08:09", "throughput": 1131.14, "total_tokens": 32994432}
{"current_steps": 1045, "total_steps": 2341, "loss": 0.6752, "learning_rate": 2.9190608736809664e-05, "epoch": 0.44629510997224003, "percentage": 44.64, "elapsed_time": "8:08:14", "remaining_time": "10:05:31", "throughput": 1131.06, "total_tokens": 33134112}
{"current_steps": 1050, "total_steps": 2341, "loss": 0.8079, "learning_rate": 2.902514069017409e-05, "epoch": 0.4484304932735426, "percentage": 44.85, "elapsed_time": "8:10:47", "remaining_time": "10:03:25", "throughput": 1131.08, "total_tokens": 33307008}
{"current_steps": 1055, "total_steps": 2341, "loss": 0.6908, "learning_rate": 2.8859491419267264e-05, "epoch": 0.4505658765748452, "percentage": 45.07, "elapsed_time": "8:13:18", "remaining_time": "10:01:19", "throughput": 1131.09, "total_tokens": 33478752}
{"current_steps": 1060, "total_steps": 2341, "loss": 0.6369, "learning_rate": 2.86936683821312e-05, "epoch": 0.4527012598761478, "percentage": 45.28, "elapsed_time": "8:15:41", "remaining_time": "9:59:02", "throughput": 1131.12, "total_tokens": 33641728}
{"current_steps": 1065, "total_steps": 2341, "loss": 0.6272, "learning_rate": 2.8527679044631417e-05, "epoch": 0.4548366431774504, "percentage": 45.49, "elapsed_time": "8:18:17", "remaining_time": "9:57:00", "throughput": 1131.19, "total_tokens": 33819104}
{"current_steps": 1070, "total_steps": 2341, "loss": 0.5017, "learning_rate": 2.836153088012078e-05, "epoch": 0.45697202647875296, "percentage": 45.71, "elapsed_time": "8:20:12", "remaining_time": "9:54:10", "throughput": 1131.08, "total_tokens": 33946336}
{"current_steps": 1075, "total_steps": 2341, "loss": 0.5854, "learning_rate": 2.8195231369103042e-05, "epoch": 0.45910740978005554, "percentage": 45.92, "elapsed_time": "8:22:36", "remaining_time": "9:51:54", "throughput": 1131.15, "total_tokens": 34111232}
{"current_steps": 1080, "total_steps": 2341, "loss": 0.5877, "learning_rate": 2.802878799889605e-05, "epoch": 0.4612427930813581, "percentage": 46.13, "elapsed_time": "8:24:55", "remaining_time": "9:49:32", "throughput": 1131.18, "total_tokens": 34269536}
{"current_steps": 1085, "total_steps": 2341, "loss": 0.7302, "learning_rate": 2.786220826329462e-05, "epoch": 0.4633781763826607, "percentage": 46.35, "elapsed_time": "8:27:08", "remaining_time": "9:47:04", "throughput": 1131.17, "total_tokens": 34420224}
{"current_steps": 1090, "total_steps": 2341, "loss": 0.9365, "learning_rate": 2.7695499662233164e-05, "epoch": 0.4655135596839633, "percentage": 46.56, "elapsed_time": "8:29:12", "remaining_time": "9:44:25", "throughput": 1131.15, "total_tokens": 34559872}
{"current_steps": 1095, "total_steps": 2341, "loss": 0.6596, "learning_rate": 2.752866970144803e-05, "epoch": 0.4676489429852659, "percentage": 46.77, "elapsed_time": "8:31:45", "remaining_time": "9:42:20", "throughput": 1131.2, "total_tokens": 34734400}
{"current_steps": 1100, "total_steps": 2341, "loss": 0.7114, "learning_rate": 2.7361725892139533e-05, "epoch": 0.46978432628656847, "percentage": 46.99, "elapsed_time": "8:34:01", "remaining_time": "9:39:55", "throughput": 1131.21, "total_tokens": 34888416}
{"current_steps": 1105, "total_steps": 2341, "loss": 0.5746, "learning_rate": 2.719467575063382e-05, "epoch": 0.47191970958787105, "percentage": 47.2, "elapsed_time": "8:36:01", "remaining_time": "9:37:11", "throughput": 1131.12, "total_tokens": 35020992}
{"current_steps": 1110, "total_steps": 2341, "loss": 0.7177, "learning_rate": 2.7027526798044427e-05, "epoch": 0.4740550928891736, "percentage": 47.42, "elapsed_time": "8:38:51", "remaining_time": "9:35:24", "throughput": 1131.18, "total_tokens": 35215072}
{"current_steps": 1115, "total_steps": 2341, "loss": 0.6877, "learning_rate": 2.6860286559933684e-05, "epoch": 0.47619047619047616, "percentage": 47.63, "elapsed_time": "8:41:18", "remaining_time": "9:33:12", "throughput": 1131.15, "total_tokens": 35380928}
{"current_steps": 1120, "total_steps": 2341, "loss": 0.6099, "learning_rate": 2.6692962565973866e-05, "epoch": 0.47832585949177875, "percentage": 47.84, "elapsed_time": "8:43:40", "remaining_time": "9:30:53", "throughput": 1131.12, "total_tokens": 35540480}
{"current_steps": 1125, "total_steps": 2341, "loss": 0.5757, "learning_rate": 2.652556234960821e-05, "epoch": 0.48046124279308133, "percentage": 48.06, "elapsed_time": "8:46:05", "remaining_time": "9:28:38", "throughput": 1131.12, "total_tokens": 35704256}
{"current_steps": 1130, "total_steps": 2341, "loss": 0.683, "learning_rate": 2.635809344771169e-05, "epoch": 0.4825966260943839, "percentage": 48.27, "elapsed_time": "8:48:21", "remaining_time": "9:26:14", "throughput": 1131.06, "total_tokens": 35856608}
{"current_steps": 1135, "total_steps": 2341, "loss": 0.6502, "learning_rate": 2.619056340025175e-05, "epoch": 0.4847320093956865, "percentage": 48.48, "elapsed_time": "8:50:30", "remaining_time": "9:23:41", "throughput": 1131.0, "total_tokens": 35999840}
{"current_steps": 1140, "total_steps": 2341, "loss": 0.6337, "learning_rate": 2.6022979749948783e-05, "epoch": 0.4868673926969891, "percentage": 48.7, "elapsed_time": "8:52:27", "remaining_time": "9:20:57", "throughput": 1130.89, "total_tokens": 36129152}
{"current_steps": 1145, "total_steps": 2341, "loss": 0.7166, "learning_rate": 2.5855350041936537e-05, "epoch": 0.48900277599829167, "percentage": 48.91, "elapsed_time": "8:54:51", "remaining_time": "9:18:40", "throughput": 1130.92, "total_tokens": 36293152}
{"current_steps": 1150, "total_steps": 2341, "loss": 0.7633, "learning_rate": 2.5687681823422445e-05, "epoch": 0.49113815929959426, "percentage": 49.12, "elapsed_time": "8:57:06", "remaining_time": "9:16:15", "throughput": 1130.92, "total_tokens": 36445696}
{"current_steps": 1155, "total_steps": 2341, "loss": 0.6183, "learning_rate": 2.551998264334777e-05, "epoch": 0.49327354260089684, "percentage": 49.34, "elapsed_time": "8:59:35", "remaining_time": "9:14:04", "throughput": 1130.93, "total_tokens": 36614528}
{"current_steps": 1160, "total_steps": 2341, "loss": 0.5267, "learning_rate": 2.5352260052047788e-05, "epoch": 0.4954089259021994, "percentage": 49.55, "elapsed_time": "9:01:40", "remaining_time": "9:11:29", "throughput": 1130.89, "total_tokens": 36754880}
{"current_steps": 1165, "total_steps": 2341, "loss": 0.684, "learning_rate": 2.518452160091181e-05, "epoch": 0.497544309203502, "percentage": 49.77, "elapsed_time": "9:04:13", "remaining_time": "9:09:21", "throughput": 1131.04, "total_tokens": 36932000}
{"current_steps": 1170, "total_steps": 2341, "loss": 0.7886, "learning_rate": 2.5016774842043194e-05, "epoch": 0.4996796925048046, "percentage": 49.98, "elapsed_time": "9:06:35", "remaining_time": "9:07:03", "throughput": 1131.07, "total_tokens": 37093504}
{"current_steps": 1175, "total_steps": 2341, "loss": 0.691, "learning_rate": 2.484902732791936e-05, "epoch": 0.5018150758061072, "percentage": 50.19, "elapsed_time": "9:09:12", "remaining_time": "9:04:59", "throughput": 1131.12, "total_tokens": 37272736}
{"current_steps": 1180, "total_steps": 2341, "loss": 0.7877, "learning_rate": 2.4681286611051708e-05, "epoch": 0.5039504591074098, "percentage": 50.41, "elapsed_time": "9:11:26", "remaining_time": "9:02:33", "throughput": 1131.12, "total_tokens": 37425024}
{"current_steps": 1185, "total_steps": 2341, "loss": 0.6496, "learning_rate": 2.4513560243645635e-05, "epoch": 0.5060858424087123, "percentage": 50.62, "elapsed_time": "9:14:00", "remaining_time": "9:00:27", "throughput": 1131.16, "total_tokens": 37600736}
{"current_steps": 1190, "total_steps": 2341, "loss": 0.6722, "learning_rate": 2.4345855777260462e-05, "epoch": 0.5082212257100149, "percentage": 50.83, "elapsed_time": "9:16:34", "remaining_time": "8:58:19", "throughput": 1131.19, "total_tokens": 37775072}
{"current_steps": 1195, "total_steps": 2341, "loss": 0.6637, "learning_rate": 2.4178180762469447e-05, "epoch": 0.5103566090113175, "percentage": 51.05, "elapsed_time": "9:18:33", "remaining_time": "8:55:39", "throughput": 1131.15, "total_tokens": 37908864}
{"current_steps": 1200, "total_steps": 2341, "loss": 0.6507, "learning_rate": 2.4010542748519863e-05, "epoch": 0.5124919923126201, "percentage": 51.26, "elapsed_time": "9:21:19", "remaining_time": "8:53:44", "throughput": 1131.22, "total_tokens": 38099328}
{"current_steps": 1205, "total_steps": 2341, "loss": 0.8343, "learning_rate": 2.384294928299309e-05, "epoch": 0.5146273756139227, "percentage": 51.47, "elapsed_time": "9:23:31", "remaining_time": "8:51:15", "throughput": 1131.19, "total_tokens": 38247072}
{"current_steps": 1210, "total_steps": 2341, "loss": 0.598, "learning_rate": 2.3675407911464788e-05, "epoch": 0.5167627589152253, "percentage": 51.69, "elapsed_time": "9:25:40", "remaining_time": "8:48:44", "throughput": 1131.12, "total_tokens": 38391168}
{"current_steps": 1215, "total_steps": 2341, "loss": 0.6245, "learning_rate": 2.350792617716521e-05, "epoch": 0.5188981422165279, "percentage": 51.9, "elapsed_time": "9:28:19", "remaining_time": "8:46:41", "throughput": 1131.21, "total_tokens": 38573664}
{"current_steps": 1220, "total_steps": 2341, "loss": 0.72, "learning_rate": 2.334051162063953e-05, "epoch": 0.5210335255178304, "percentage": 52.11, "elapsed_time": "9:30:45", "remaining_time": "8:44:26", "throughput": 1131.26, "total_tokens": 38740672}
{"current_steps": 1225, "total_steps": 2341, "loss": 0.6333, "learning_rate": 2.3173171779408386e-05, "epoch": 0.523168908819133, "percentage": 52.33, "elapsed_time": "9:32:37", "remaining_time": "8:41:40", "throughput": 1131.16, "total_tokens": 38864224}
{"current_steps": 1230, "total_steps": 2341, "loss": 0.7262, "learning_rate": 2.3005914187628492e-05, "epoch": 0.5253042921204356, "percentage": 52.54, "elapsed_time": "9:34:40", "remaining_time": "8:39:04", "throughput": 1131.09, "total_tokens": 39000320}
{"current_steps": 1235, "total_steps": 2341, "loss": 0.5828, "learning_rate": 2.2838746375753456e-05, "epoch": 0.5274396754217382, "percentage": 52.76, "elapsed_time": "9:37:31", "remaining_time": "8:37:11", "throughput": 1131.23, "total_tokens": 39198400}
{"current_steps": 1240, "total_steps": 2341, "loss": 0.6544, "learning_rate": 2.2671675870194677e-05, "epoch": 0.5295750587230408, "percentage": 52.97, "elapsed_time": "9:39:54", "remaining_time": "8:34:53", "throughput": 1131.2, "total_tokens": 39359232}
{"current_steps": 1245, "total_steps": 2341, "loss": 0.6669, "learning_rate": 2.2504710192982575e-05, "epoch": 0.5317104420243434, "percentage": 53.18, "elapsed_time": "9:42:02", "remaining_time": "8:32:22", "throughput": 1131.15, "total_tokens": 39502176}
{"current_steps": 1250, "total_steps": 2341, "loss": 0.8427, "learning_rate": 2.2337856861427843e-05, "epoch": 0.533845825325646, "percentage": 53.4, "elapsed_time": "9:45:09", "remaining_time": "8:30:43", "throughput": 1131.26, "total_tokens": 39717472}
{"current_steps": 1255, "total_steps": 2341, "loss": 0.5687, "learning_rate": 2.2171123387783028e-05, "epoch": 0.5359812086269485, "percentage": 53.61, "elapsed_time": "9:46:58", "remaining_time": "8:27:55", "throughput": 1131.11, "total_tokens": 39836000}
{"current_steps": 1260, "total_steps": 2341, "loss": 0.6957, "learning_rate": 2.2004517278904316e-05, "epoch": 0.5381165919282511, "percentage": 53.82, "elapsed_time": "9:49:18", "remaining_time": "8:25:35", "throughput": 1131.13, "total_tokens": 39995200}
{"current_steps": 1265, "total_steps": 2341, "loss": 0.6944, "learning_rate": 2.183804603591352e-05, "epoch": 0.5402519752295537, "percentage": 54.04, "elapsed_time": "9:51:54", "remaining_time": "8:23:28", "throughput": 1131.18, "total_tokens": 40173280}
{"current_steps": 1270, "total_steps": 2341, "loss": 0.7211, "learning_rate": 2.1671717153860385e-05, "epoch": 0.5423873585308563, "percentage": 54.25, "elapsed_time": "9:54:02", "remaining_time": "8:20:57", "throughput": 1131.11, "total_tokens": 40315296}
{"current_steps": 1275, "total_steps": 2341, "loss": 0.6752, "learning_rate": 2.1505538121385127e-05, "epoch": 0.5445227418321589, "percentage": 54.46, "elapsed_time": "9:56:32", "remaining_time": "8:18:45", "throughput": 1131.13, "total_tokens": 40485504}
{"current_steps": 1280, "total_steps": 2341, "loss": 0.7874, "learning_rate": 2.133951642038127e-05, "epoch": 0.5466581251334615, "percentage": 54.68, "elapsed_time": "9:59:18", "remaining_time": "8:16:46", "throughput": 1131.26, "total_tokens": 40678624}
{"current_steps": 1285, "total_steps": 2341, "loss": 0.6918, "learning_rate": 2.117365952565879e-05, "epoch": 0.548793508434764, "percentage": 54.89, "elapsed_time": "10:01:33", "remaining_time": "8:14:21", "throughput": 1131.2, "total_tokens": 40829472}
{"current_steps": 1290, "total_steps": 2341, "loss": 0.6707, "learning_rate": 2.100797490460756e-05, "epoch": 0.5509288917360666, "percentage": 55.1, "elapsed_time": "10:03:27", "remaining_time": "8:11:39", "throughput": 1131.1, "total_tokens": 40954304}
{"current_steps": 1295, "total_steps": 2341, "loss": 0.6515, "learning_rate": 2.0842470016861184e-05, "epoch": 0.5530642750373692, "percentage": 55.32, "elapsed_time": "10:05:52", "remaining_time": "8:09:22", "throughput": 1131.17, "total_tokens": 41120160}
{"current_steps": 1300, "total_steps": 2341, "loss": 0.7781, "learning_rate": 2.06771523139611e-05, "epoch": 0.5551996583386718, "percentage": 55.53, "elapsed_time": "10:08:18", "remaining_time": "8:07:06", "throughput": 1131.11, "total_tokens": 41283680}
{"current_steps": 1305, "total_steps": 2341, "loss": 0.6262, "learning_rate": 2.051202923902112e-05, "epoch": 0.5573350416399744, "percentage": 55.75, "elapsed_time": "10:10:18", "remaining_time": "8:04:30", "throughput": 1131.03, "total_tokens": 41416448}
{"current_steps": 1310, "total_steps": 2341, "loss": 0.5474, "learning_rate": 2.0347108226392285e-05, "epoch": 0.559470424941277, "percentage": 55.96, "elapsed_time": "10:12:30", "remaining_time": "8:02:03", "throughput": 1130.97, "total_tokens": 41563552}
{"current_steps": 1315, "total_steps": 2341, "loss": 0.7023, "learning_rate": 2.0182396701328187e-05, "epoch": 0.5616058082425796, "percentage": 56.17, "elapsed_time": "10:14:42", "remaining_time": "7:59:36", "throughput": 1130.99, "total_tokens": 41713152}
{"current_steps": 1320, "total_steps": 2341, "loss": 0.8375, "learning_rate": 2.001790207965062e-05, "epoch": 0.5637411915438821, "percentage": 56.39, "elapsed_time": "10:17:25", "remaining_time": "7:57:33", "throughput": 1131.09, "total_tokens": 41901728}
{"current_steps": 1325, "total_steps": 2341, "loss": 0.7857, "learning_rate": 1.9853631767415737e-05, "epoch": 0.5658765748451847, "percentage": 56.6, "elapsed_time": "10:19:22", "remaining_time": "7:54:55", "throughput": 1131.03, "total_tokens": 42031776}
{"current_steps": 1330, "total_steps": 2341, "loss": 0.7697, "learning_rate": 1.9689593160580577e-05, "epoch": 0.5680119581464873, "percentage": 56.81, "elapsed_time": "10:21:48", "remaining_time": "7:52:39", "throughput": 1131.02, "total_tokens": 42196352}
{"current_steps": 1335, "total_steps": 2341, "loss": 0.8586, "learning_rate": 1.9525793644670094e-05, "epoch": 0.5701473414477899, "percentage": 57.03, "elapsed_time": "10:23:57", "remaining_time": "7:50:11", "throughput": 1130.99, "total_tokens": 42341088}
{"current_steps": 1340, "total_steps": 2341, "loss": 0.8365, "learning_rate": 1.93622405944446e-05, "epoch": 0.5722827247490925, "percentage": 57.24, "elapsed_time": "10:26:12", "remaining_time": "7:47:47", "throughput": 1131.02, "total_tokens": 42495424}
{"current_steps": 1345, "total_steps": 2341, "loss": 0.6521, "learning_rate": 1.9198941373567797e-05, "epoch": 0.5744181080503951, "percentage": 57.45, "elapsed_time": "10:28:07", "remaining_time": "7:45:08", "throughput": 1130.93, "total_tokens": 42622080}
{"current_steps": 1350, "total_steps": 2341, "loss": 0.8343, "learning_rate": 1.9035903334275186e-05, "epoch": 0.5765534913516976, "percentage": 57.67, "elapsed_time": "10:30:57", "remaining_time": "7:43:10", "throughput": 1131.01, "total_tokens": 42817472}
{"current_steps": 1355, "total_steps": 2341, "loss": 0.6469, "learning_rate": 1.887313381704308e-05, "epoch": 0.5786888746530002, "percentage": 57.88, "elapsed_time": "10:33:10", "remaining_time": "7:40:44", "throughput": 1131.01, "total_tokens": 42967968}
{"current_steps": 1360, "total_steps": 2341, "loss": 0.6199, "learning_rate": 1.871064015025808e-05, "epoch": 0.5808242579543028, "percentage": 58.09, "elapsed_time": "10:35:19", "remaining_time": "7:38:16", "throughput": 1130.99, "total_tokens": 43113120}
{"current_steps": 1365, "total_steps": 2341, "loss": 0.6748, "learning_rate": 1.8548429649887167e-05, "epoch": 0.5829596412556054, "percentage": 58.31, "elapsed_time": "10:38:13", "remaining_time": "7:36:20", "throughput": 1131.04, "total_tokens": 43311584}
{"current_steps": 1370, "total_steps": 2341, "loss": 0.6825, "learning_rate": 1.8386509619148283e-05, "epoch": 0.585095024556908, "percentage": 58.52, "elapsed_time": "10:40:32", "remaining_time": "7:33:59", "throughput": 1131.03, "total_tokens": 43468704}
{"current_steps": 1375, "total_steps": 2341, "loss": 0.7961, "learning_rate": 1.822488734818153e-05, "epoch": 0.5872304078582106, "percentage": 58.74, "elapsed_time": "10:42:53", "remaining_time": "7:31:39", "throughput": 1131.07, "total_tokens": 43629152}
{"current_steps": 1380, "total_steps": 2341, "loss": 0.7024, "learning_rate": 1.8063570113720955e-05, "epoch": 0.5893657911595132, "percentage": 58.95, "elapsed_time": "10:45:21", "remaining_time": "7:29:24", "throughput": 1131.07, "total_tokens": 43796384}
{"current_steps": 1385, "total_steps": 2341, "loss": 0.7315, "learning_rate": 1.79025651787669e-05, "epoch": 0.5915011744608157, "percentage": 59.16, "elapsed_time": "10:47:54", "remaining_time": "7:27:13", "throughput": 1131.14, "total_tokens": 43972640}
{"current_steps": 1390, "total_steps": 2341, "loss": 0.7955, "learning_rate": 1.7741879792259033e-05, "epoch": 0.5936365577621183, "percentage": 59.38, "elapsed_time": "10:49:55", "remaining_time": "7:24:39", "throughput": 1131.15, "total_tokens": 44110080}
{"current_steps": 1395, "total_steps": 2341, "loss": 0.8156, "learning_rate": 1.7581521188749968e-05, "epoch": 0.5957719410634209, "percentage": 59.59, "elapsed_time": "10:52:17", "remaining_time": "7:22:20", "throughput": 1131.14, "total_tokens": 44270080}
{"current_steps": 1400, "total_steps": 2341, "loss": 0.688, "learning_rate": 1.742149658807952e-05, "epoch": 0.5979073243647235, "percentage": 59.8, "elapsed_time": "10:54:44", "remaining_time": "7:20:05", "throughput": 1131.16, "total_tokens": 44437280}
{"current_steps": 1405, "total_steps": 2341, "loss": 0.7067, "learning_rate": 1.7261813195049682e-05, "epoch": 0.6000427076660261, "percentage": 60.02, "elapsed_time": "10:56:51", "remaining_time": "7:17:35", "throughput": 1131.14, "total_tokens": 44579680}
{"current_steps": 1410, "total_steps": 2341, "loss": 0.565, "learning_rate": 1.7102478199100218e-05, "epoch": 0.6021780909673287, "percentage": 60.23, "elapsed_time": "10:59:52", "remaining_time": "7:15:42", "throughput": 1131.24, "total_tokens": 44788832}
{"current_steps": 1415, "total_steps": 2341, "loss": 0.5555, "learning_rate": 1.6943498773984974e-05, "epoch": 0.6043134742686312, "percentage": 60.44, "elapsed_time": "11:02:18", "remaining_time": "7:13:25", "throughput": 1131.19, "total_tokens": 44951488}
{"current_steps": 1420, "total_steps": 2341, "loss": 0.7106, "learning_rate": 1.678488207744891e-05, "epoch": 0.6064488575699338, "percentage": 60.66, "elapsed_time": "11:04:50", "remaining_time": "7:11:12", "throughput": 1131.28, "total_tokens": 45127232}
{"current_steps": 1425, "total_steps": 2341, "loss": 0.8088, "learning_rate": 1.6626635250905813e-05, "epoch": 0.6085842408712364, "percentage": 60.87, "elapsed_time": "11:07:13", "remaining_time": "7:08:53", "throughput": 1131.32, "total_tokens": 45290592}
{"current_steps": 1430, "total_steps": 2341, "loss": 0.5566, "learning_rate": 1.646876541911679e-05, "epoch": 0.610719624172539, "percentage": 61.09, "elapsed_time": "11:09:19", "remaining_time": "7:06:23", "throughput": 1131.25, "total_tokens": 45429920}
{"current_steps": 1435, "total_steps": 2341, "loss": 0.6124, "learning_rate": 1.6311279689869464e-05, "epoch": 0.6128550074738416, "percentage": 61.3, "elapsed_time": "11:11:57", "remaining_time": "7:04:14", "throughput": 1131.33, "total_tokens": 45612000}
{"current_steps": 1440, "total_steps": 2341, "loss": 0.764, "learning_rate": 1.615418515365799e-05, "epoch": 0.6149903907751442, "percentage": 61.51, "elapsed_time": "11:14:03", "remaining_time": "7:01:45", "throughput": 1131.27, "total_tokens": 45752192}
{"current_steps": 1445, "total_steps": 2341, "loss": 0.6346, "learning_rate": 1.5997488883363804e-05, "epoch": 0.6171257740764468, "percentage": 61.73, "elapsed_time": "11:16:35", "remaining_time": "6:59:31", "throughput": 1131.36, "total_tokens": 45927808}
{"current_steps": 1450, "total_steps": 2341, "loss": 0.5827, "learning_rate": 1.5841197933937164e-05, "epoch": 0.6192611573777493, "percentage": 61.94, "elapsed_time": "11:18:52", "remaining_time": "6:57:09", "throughput": 1131.33, "total_tokens": 46082432}
{"current_steps": 1455, "total_steps": 2341, "loss": 0.6316, "learning_rate": 1.568531934207955e-05, "epoch": 0.6213965406790519, "percentage": 62.15, "elapsed_time": "11:21:00", "remaining_time": "6:54:41", "throughput": 1131.33, "total_tokens": 46226688}
{"current_steps": 1460, "total_steps": 2341, "loss": 0.7383, "learning_rate": 1.552986012592681e-05, "epoch": 0.6235319239803545, "percentage": 62.37, "elapsed_time": "11:23:00", "remaining_time": "6:52:08", "throughput": 1131.3, "total_tokens": 46361216}
{"current_steps": 1465, "total_steps": 2341, "loss": 0.598, "learning_rate": 1.5374827284733223e-05, "epoch": 0.6256673072816571, "percentage": 62.58, "elapsed_time": "11:25:15", "remaining_time": "6:49:45", "throughput": 1131.25, "total_tokens": 46511840}
{"current_steps": 1470, "total_steps": 2341, "loss": 0.6047, "learning_rate": 1.5220227798556333e-05, "epoch": 0.6278026905829597, "percentage": 62.79, "elapsed_time": "11:27:06", "remaining_time": "6:47:07", "throughput": 1131.19, "total_tokens": 46635328}
{"current_steps": 1475, "total_steps": 2341, "loss": 0.5981, "learning_rate": 1.5066068627942714e-05, "epoch": 0.6299380738842623, "percentage": 63.01, "elapsed_time": "11:29:24", "remaining_time": "6:44:45", "throughput": 1131.2, "total_tokens": 46791520}
{"current_steps": 1480, "total_steps": 2341, "loss": 0.9216, "learning_rate": 1.4912356713614573e-05, "epoch": 0.6320734571855648, "percentage": 63.22, "elapsed_time": "11:31:55", "remaining_time": "6:42:32", "throughput": 1131.25, "total_tokens": 46964672}
{"current_steps": 1485, "total_steps": 2341, "loss": 0.7327, "learning_rate": 1.4759098976157227e-05, "epoch": 0.6342088404868674, "percentage": 63.43, "elapsed_time": "11:34:10", "remaining_time": "6:40:08", "throughput": 1131.25, "total_tokens": 47116864}
{"current_steps": 1490, "total_steps": 2341, "loss": 0.6273, "learning_rate": 1.4606302315707587e-05, "epoch": 0.63634422378817, "percentage": 63.65, "elapsed_time": "11:36:10", "remaining_time": "6:37:37", "throughput": 1131.16, "total_tokens": 47249824}
{"current_steps": 1495, "total_steps": 2341, "loss": 0.6039, "learning_rate": 1.4453973611643445e-05, "epoch": 0.6384796070894726, "percentage": 63.86, "elapsed_time": "11:38:28", "remaining_time": "6:35:15", "throughput": 1131.15, "total_tokens": 47405440}
{"current_steps": 1500, "total_steps": 2341, "loss": 0.6372, "learning_rate": 1.4302119722273727e-05, "epoch": 0.6406149903907752, "percentage": 64.08, "elapsed_time": "11:40:46", "remaining_time": "6:32:53", "throughput": 1131.16, "total_tokens": 47560960}
{"current_steps": 1505, "total_steps": 2341, "loss": 0.5995, "learning_rate": 1.4150747484529758e-05, "epoch": 0.6427503736920778, "percentage": 64.29, "elapsed_time": "11:43:14", "remaining_time": "6:30:38", "throughput": 1131.11, "total_tokens": 47726656}
{"current_steps": 1510, "total_steps": 2341, "loss": 0.7475, "learning_rate": 1.3999863713657405e-05, "epoch": 0.6448857569933804, "percentage": 64.5, "elapsed_time": "11:45:32", "remaining_time": "6:28:16", "throughput": 1131.12, "total_tokens": 47882784}
{"current_steps": 1515, "total_steps": 2341, "loss": 0.7008, "learning_rate": 1.3849475202910244e-05, "epoch": 0.6470211402946829, "percentage": 64.72, "elapsed_time": "11:47:58", "remaining_time": "6:25:59", "throughput": 1131.14, "total_tokens": 48048608}
{"current_steps": 1520, "total_steps": 2341, "loss": 0.5906, "learning_rate": 1.369958872324374e-05, "epoch": 0.6491565235959855, "percentage": 64.93, "elapsed_time": "11:49:48", "remaining_time": "6:23:23", "throughput": 1131.0, "total_tokens": 48167424}
{"current_steps": 1525, "total_steps": 2341, "loss": 0.7876, "learning_rate": 1.3550211023010346e-05, "epoch": 0.6512919068972881, "percentage": 65.14, "elapsed_time": "11:52:20", "remaining_time": "6:21:09", "throughput": 1131.06, "total_tokens": 48342048}
{"current_steps": 1530, "total_steps": 2341, "loss": 0.6946, "learning_rate": 1.3401348827655665e-05, "epoch": 0.6534272901985907, "percentage": 65.36, "elapsed_time": "11:54:54", "remaining_time": "6:18:57", "throughput": 1131.13, "total_tokens": 48519488}
{"current_steps": 1535, "total_steps": 2341, "loss": 0.661, "learning_rate": 1.3253008839415726e-05, "epoch": 0.6555626734998933, "percentage": 65.57, "elapsed_time": "11:57:08", "remaining_time": "6:16:33", "throughput": 1131.14, "total_tokens": 48671424}
{"current_steps": 1540, "total_steps": 2341, "loss": 0.6125, "learning_rate": 1.310519773701515e-05, "epoch": 0.6576980568011959, "percentage": 65.78, "elapsed_time": "11:59:04", "remaining_time": "6:14:00", "throughput": 1131.0, "total_tokens": 48796000}
{"current_steps": 1545, "total_steps": 2341, "loss": 0.6231, "learning_rate": 1.2957922175366493e-05, "epoch": 0.6598334401024984, "percentage": 66.0, "elapsed_time": "12:01:39", "remaining_time": "6:11:48", "throughput": 1131.03, "total_tokens": 48973024}
{"current_steps": 1550, "total_steps": 2341, "loss": 0.836, "learning_rate": 1.2811188785270617e-05, "epoch": 0.661968823403801, "percentage": 66.21, "elapsed_time": "12:04:04", "remaining_time": "6:09:30", "throughput": 1131.09, "total_tokens": 49140192}
{"current_steps": 1555, "total_steps": 2341, "loss": 0.6581, "learning_rate": 1.2665004173118136e-05, "epoch": 0.6641042067051036, "percentage": 66.42, "elapsed_time": "12:06:36", "remaining_time": "6:07:16", "throughput": 1131.14, "total_tokens": 49313920}
{"current_steps": 1560, "total_steps": 2341, "loss": 0.6878, "learning_rate": 1.2519374920591987e-05, "epoch": 0.6662395900064062, "percentage": 66.64, "elapsed_time": "12:09:02", "remaining_time": "6:04:59", "throughput": 1131.16, "total_tokens": 49480096}
{"current_steps": 1565, "total_steps": 2341, "loss": 0.7337, "learning_rate": 1.2374307584371104e-05, "epoch": 0.6683749733077088, "percentage": 66.85, "elapsed_time": "12:11:20", "remaining_time": "6:02:38", "throughput": 1131.15, "total_tokens": 49635936}
{"current_steps": 1570, "total_steps": 2341, "loss": 0.6751, "learning_rate": 1.222980869583521e-05, "epoch": 0.6705103566090114, "percentage": 67.07, "elapsed_time": "12:13:04", "remaining_time": "5:59:59", "throughput": 1131.07, "total_tokens": 49749408}
{"current_steps": 1575, "total_steps": 2341, "loss": 0.7597, "learning_rate": 1.2085884760770755e-05, "epoch": 0.672645739910314, "percentage": 67.28, "elapsed_time": "12:15:31", "remaining_time": "5:57:43", "throughput": 1131.08, "total_tokens": 49916512}
{"current_steps": 1580, "total_steps": 2341, "loss": 0.7161, "learning_rate": 1.1942542259078013e-05, "epoch": 0.6747811232116165, "percentage": 67.49, "elapsed_time": "12:17:33", "remaining_time": "5:55:14", "throughput": 1131.07, "total_tokens": 50054080}
{"current_steps": 1585, "total_steps": 2341, "loss": 0.6078, "learning_rate": 1.1799787644479329e-05, "epoch": 0.676916506512919, "percentage": 67.71, "elapsed_time": "12:19:51", "remaining_time": "5:52:53", "throughput": 1131.07, "total_tokens": 50209472}
{"current_steps": 1590, "total_steps": 2341, "loss": 0.7661, "learning_rate": 1.165762734422855e-05, "epoch": 0.6790518898142216, "percentage": 67.92, "elapsed_time": "12:22:18", "remaining_time": "5:50:36", "throughput": 1131.03, "total_tokens": 50374560}
{"current_steps": 1595, "total_steps": 2341, "loss": 0.7189, "learning_rate": 1.1516067758821658e-05, "epoch": 0.6811872731155242, "percentage": 68.13, "elapsed_time": "12:24:34", "remaining_time": "5:48:14", "throughput": 1130.98, "total_tokens": 50525632}
{"current_steps": 1600, "total_steps": 2341, "loss": 0.7739, "learning_rate": 1.13751152617086e-05, "epoch": 0.6833226564168268, "percentage": 68.35, "elapsed_time": "12:26:48", "remaining_time": "5:45:52", "throughput": 1130.99, "total_tokens": 50678080}
{"current_steps": 1605, "total_steps": 2341, "loss": 0.8047, "learning_rate": 1.1234776199006324e-05, "epoch": 0.6854580397181294, "percentage": 68.56, "elapsed_time": "12:29:14", "remaining_time": "5:43:34", "throughput": 1131.04, "total_tokens": 50845056}
{"current_steps": 1610, "total_steps": 2341, "loss": 0.599, "learning_rate": 1.1095056889213073e-05, "epoch": 0.6875934230194319, "percentage": 68.77, "elapsed_time": "12:31:37", "remaining_time": "5:41:15", "throughput": 1131.08, "total_tokens": 51008896}
{"current_steps": 1615, "total_steps": 2341, "loss": 0.6548, "learning_rate": 1.0955963622923896e-05, "epoch": 0.6897288063207345, "percentage": 68.99, "elapsed_time": "12:34:04", "remaining_time": "5:38:59", "throughput": 1131.1, "total_tokens": 51176448}
{"current_steps": 1620, "total_steps": 2341, "loss": 0.6567, "learning_rate": 1.0817502662547426e-05, "epoch": 0.6918641896220371, "percentage": 69.2, "elapsed_time": "12:36:34", "remaining_time": "5:36:43", "throughput": 1131.14, "total_tokens": 51347616}
{"current_steps": 1625, "total_steps": 2341, "loss": 0.5926, "learning_rate": 1.0679680242023946e-05, "epoch": 0.6939995729233397, "percentage": 69.41, "elapsed_time": "12:38:58", "remaining_time": "5:34:25", "throughput": 1131.17, "total_tokens": 51512000}
{"current_steps": 1630, "total_steps": 2341, "loss": 0.8239, "learning_rate": 1.0542502566544668e-05, "epoch": 0.6961349562246423, "percentage": 69.63, "elapsed_time": "12:41:11", "remaining_time": "5:32:01", "throughput": 1131.1, "total_tokens": 51659328}
{"current_steps": 1635, "total_steps": 2341, "loss": 0.7617, "learning_rate": 1.040597581227242e-05, "epoch": 0.6982703395259449, "percentage": 69.84, "elapsed_time": "12:43:20", "remaining_time": "5:29:36", "throughput": 1131.12, "total_tokens": 51806176}
{"current_steps": 1640, "total_steps": 2341, "loss": 0.6469, "learning_rate": 1.0270106126063539e-05, "epoch": 0.7004057228272474, "percentage": 70.06, "elapsed_time": "12:45:12", "remaining_time": "5:27:04", "throughput": 1131.07, "total_tokens": 51930816}
{"current_steps": 1645, "total_steps": 2341, "loss": 0.8937, "learning_rate": 1.0134899625191124e-05, "epoch": 0.70254110612855, "percentage": 70.27, "elapsed_time": "12:47:04", "remaining_time": "5:24:32", "throughput": 1131.04, "total_tokens": 52054944}
{"current_steps": 1650, "total_steps": 2341, "loss": 0.6863, "learning_rate": 1.0000362397069612e-05, "epoch": 0.7046764894298526, "percentage": 70.48, "elapsed_time": "12:49:26", "remaining_time": "5:22:13", "throughput": 1130.99, "total_tokens": 52213536}
{"current_steps": 1655, "total_steps": 2341, "loss": 0.6294, "learning_rate": 9.866500498980744e-06, "epoch": 0.7068118727311552, "percentage": 70.7, "elapsed_time": "12:51:41", "remaining_time": "5:19:51", "throughput": 1131.0, "total_tokens": 52366624}
{"current_steps": 1660, "total_steps": 2341, "loss": 0.644, "learning_rate": 9.733319957800781e-06, "epoch": 0.7089472560324578, "percentage": 70.91, "elapsed_time": "12:53:57", "remaining_time": "5:17:30", "throughput": 1130.96, "total_tokens": 52518688}
{"current_steps": 1665, "total_steps": 2341, "loss": 0.658, "learning_rate": 9.60082676972921e-06, "epoch": 0.7110826393337604, "percentage": 71.12, "elapsed_time": "12:55:59", "remaining_time": "5:15:03", "throughput": 1130.96, "total_tokens": 52656384}
{"current_steps": 1670, "total_steps": 2341, "loss": 0.7008, "learning_rate": 9.469026900018758e-06, "epoch": 0.713218022635063, "percentage": 71.34, "elapsed_time": "12:58:20", "remaining_time": "5:12:44", "throughput": 1130.97, "total_tokens": 52816832}
{"current_steps": 1675, "total_steps": 2341, "loss": 0.6814, "learning_rate": 9.337926282706794e-06, "epoch": 0.7153534059363655, "percentage": 71.55, "elapsed_time": "13:00:45", "remaining_time": "5:10:26", "throughput": 1130.96, "total_tokens": 52979936}
{"current_steps": 1680, "total_steps": 2341, "loss": 0.5933, "learning_rate": 9.20753082034821e-06, "epoch": 0.7174887892376681, "percentage": 71.76, "elapsed_time": "13:03:15", "remaining_time": "5:08:10", "throughput": 1130.98, "total_tokens": 53151136}
{"current_steps": 1685, "total_steps": 2341, "loss": 0.7048, "learning_rate": 9.077846383749631e-06, "epoch": 0.7196241725389707, "percentage": 71.98, "elapsed_time": "13:06:28", "remaining_time": "5:06:11", "throughput": 1131.12, "total_tokens": 53375680}
{"current_steps": 1690, "total_steps": 2341, "loss": 0.7039, "learning_rate": 8.948878811705109e-06, "epoch": 0.7217595558402733, "percentage": 72.19, "elapsed_time": "13:09:07", "remaining_time": "5:03:58", "throughput": 1131.17, "total_tokens": 53558240}
{"current_steps": 1695, "total_steps": 2341, "loss": 0.7525, "learning_rate": 8.820633910733237e-06, "epoch": 0.7238949391415759, "percentage": 72.4, "elapsed_time": "13:11:50", "remaining_time": "5:01:47", "throughput": 1131.21, "total_tokens": 53744960}
{"current_steps": 1700, "total_steps": 2341, "loss": 0.595, "learning_rate": 8.693117454815728e-06, "epoch": 0.7260303224428785, "percentage": 72.62, "elapsed_time": "13:13:55", "remaining_time": "4:59:21", "throughput": 1131.17, "total_tokens": 53884480}
{"current_steps": 1705, "total_steps": 2341, "loss": 0.5853, "learning_rate": 8.566335185137437e-06, "epoch": 0.728165705744181, "percentage": 72.83, "elapsed_time": "13:16:43", "remaining_time": "4:57:11", "throughput": 1131.26, "total_tokens": 54077792}
{"current_steps": 1710, "total_steps": 2341, "loss": 0.7973, "learning_rate": 8.440292809827898e-06, "epoch": 0.7303010890454836, "percentage": 73.05, "elapsed_time": "13:19:12", "remaining_time": "4:54:54", "throughput": 1131.25, "total_tokens": 54246368}
{"current_steps": 1715, "total_steps": 2341, "loss": 0.8046, "learning_rate": 8.314996003704305e-06, "epoch": 0.7324364723467862, "percentage": 73.26, "elapsed_time": "13:21:47", "remaining_time": "4:52:39", "throughput": 1131.27, "total_tokens": 54422240}
{"current_steps": 1720, "total_steps": 2341, "loss": 0.5263, "learning_rate": 8.190450408016032e-06, "epoch": 0.7345718556480888, "percentage": 73.47, "elapsed_time": "13:24:02", "remaining_time": "4:50:17", "throughput": 1131.25, "total_tokens": 54574592}
{"current_steps": 1725, "total_steps": 2341, "loss": 0.6577, "learning_rate": 8.06666163019063e-06, "epoch": 0.7367072389493914, "percentage": 73.69, "elapsed_time": "13:26:20", "remaining_time": "4:47:56", "throughput": 1131.21, "total_tokens": 54728160}
{"current_steps": 1730, "total_steps": 2341, "loss": 0.6628, "learning_rate": 7.943635243581373e-06, "epoch": 0.738842622250694, "percentage": 73.9, "elapsed_time": "13:28:47", "remaining_time": "4:45:38", "throughput": 1131.22, "total_tokens": 54895072}
{"current_steps": 1735, "total_steps": 2341, "loss": 0.6087, "learning_rate": 7.821376787216333e-06, "epoch": 0.7409780055519966, "percentage": 74.11, "elapsed_time": "13:31:22", "remaining_time": "4:43:23", "throughput": 1131.26, "total_tokens": 55072256}
{"current_steps": 1740, "total_steps": 2341, "loss": 0.6766, "learning_rate": 7.699891765548983e-06, "epoch": 0.7431133888532991, "percentage": 74.33, "elapsed_time": "13:33:49", "remaining_time": "4:41:05", "throughput": 1131.25, "total_tokens": 55237888}
{"current_steps": 1745, "total_steps": 2341, "loss": 0.6222, "learning_rate": 7.5791856482103765e-06, "epoch": 0.7452487721546017, "percentage": 74.54, "elapsed_time": "13:36:09", "remaining_time": "4:38:45", "throughput": 1131.27, "total_tokens": 55398048}
{"current_steps": 1750, "total_steps": 2341, "loss": 0.6083, "learning_rate": 7.459263869762892e-06, "epoch": 0.7473841554559043, "percentage": 74.75, "elapsed_time": "13:38:32", "remaining_time": "4:36:25", "throughput": 1131.25, "total_tokens": 55558336}
{"current_steps": 1755, "total_steps": 2341, "loss": 0.7643, "learning_rate": 7.340131829455541e-06, "epoch": 0.7495195387572069, "percentage": 74.97, "elapsed_time": "13:40:54", "remaining_time": "4:34:06", "throughput": 1131.23, "total_tokens": 55717888}
{"current_steps": 1760, "total_steps": 2341, "loss": 0.6745, "learning_rate": 7.221794890980888e-06, "epoch": 0.7516549220585095, "percentage": 75.18, "elapsed_time": "13:43:28", "remaining_time": "4:31:50", "throughput": 1131.27, "total_tokens": 55894816}
{"current_steps": 1765, "total_steps": 2341, "loss": 0.6846, "learning_rate": 7.104258382233556e-06, "epoch": 0.7537903053598121, "percentage": 75.4, "elapsed_time": "13:46:02", "remaining_time": "4:29:34", "throughput": 1131.32, "total_tokens": 56071360}
{"current_steps": 1770, "total_steps": 2341, "loss": 0.625, "learning_rate": 6.987527595070356e-06, "epoch": 0.7559256886611146, "percentage": 75.61, "elapsed_time": "13:47:50", "remaining_time": "4:27:03", "throughput": 1131.23, "total_tokens": 56188384}
{"current_steps": 1775, "total_steps": 2341, "loss": 0.6852, "learning_rate": 6.871607785071999e-06, "epoch": 0.7580610719624172, "percentage": 75.82, "elapsed_time": "13:50:26", "remaining_time": "4:24:48", "throughput": 1131.24, "total_tokens": 56365312}
{"current_steps": 1780, "total_steps": 2341, "loss": 0.7002, "learning_rate": 6.756504171306521e-06, "epoch": 0.7601964552637198, "percentage": 76.04, "elapsed_time": "13:52:33", "remaining_time": "4:22:23", "throughput": 1131.24, "total_tokens": 56509120}
{"current_steps": 1785, "total_steps": 2341, "loss": 0.7087, "learning_rate": 6.642221936094281e-06, "epoch": 0.7623318385650224, "percentage": 76.25, "elapsed_time": "13:54:40", "remaining_time": "4:19:59", "throughput": 1131.22, "total_tokens": 56652384}
{"current_steps": 1790, "total_steps": 2341, "loss": 0.5355, "learning_rate": 6.528766224774619e-06, "epoch": 0.764467221866325, "percentage": 76.46, "elapsed_time": "13:56:51", "remaining_time": "4:17:36", "throughput": 1131.15, "total_tokens": 56796704}
{"current_steps": 1795, "total_steps": 2341, "loss": 0.727, "learning_rate": 6.416142145474244e-06, "epoch": 0.7666026051676276, "percentage": 76.68, "elapsed_time": "13:59:27", "remaining_time": "4:15:20", "throughput": 1131.2, "total_tokens": 56975872}
{"current_steps": 1800, "total_steps": 2341, "loss": 0.7101, "learning_rate": 6.304354768877196e-06, "epoch": 0.7687379884689302, "percentage": 76.89, "elapsed_time": "14:01:57", "remaining_time": "4:13:03", "throughput": 1131.24, "total_tokens": 57147296}
{"current_steps": 1805, "total_steps": 2341, "loss": 0.799, "learning_rate": 6.1934091279965915e-06, "epoch": 0.7708733717702327, "percentage": 77.1, "elapsed_time": "14:04:13", "remaining_time": "4:10:41", "throughput": 1131.27, "total_tokens": 57302368}
{"current_steps": 1810, "total_steps": 2341, "loss": 0.6874, "learning_rate": 6.083310217947991e-06, "epoch": 0.7730087550715353, "percentage": 77.32, "elapsed_time": "14:06:41", "remaining_time": "4:08:23", "throughput": 1131.29, "total_tokens": 57471200}
{"current_steps": 1815, "total_steps": 2341, "loss": 0.7995, "learning_rate": 5.974062995724527e-06, "epoch": 0.7751441383728379, "percentage": 77.53, "elapsed_time": "14:09:42", "remaining_time": "4:06:15", "throughput": 1131.36, "total_tokens": 57679840}
{"current_steps": 1820, "total_steps": 2341, "loss": 0.6763, "learning_rate": 5.865672379973702e-06, "epoch": 0.7772795216741405, "percentage": 77.74, "elapsed_time": "14:12:11", "remaining_time": "4:03:57", "throughput": 1131.37, "total_tokens": 57849248}
{"current_steps": 1825, "total_steps": 2341, "loss": 0.5619, "learning_rate": 5.75814325077596e-06, "epoch": 0.7794149049754431, "percentage": 77.96, "elapsed_time": "14:14:20", "remaining_time": "4:01:33", "throughput": 1131.36, "total_tokens": 57993952}
{"current_steps": 1830, "total_steps": 2341, "loss": 0.6884, "learning_rate": 5.651480449424954e-06, "epoch": 0.7815502882767457, "percentage": 78.17, "elapsed_time": "14:16:34", "remaining_time": "3:59:11", "throughput": 1131.37, "total_tokens": 58146592}
{"current_steps": 1835, "total_steps": 2341, "loss": 0.7584, "learning_rate": 5.545688778209579e-06, "epoch": 0.7836856715780482, "percentage": 78.39, "elapsed_time": "14:18:57", "remaining_time": "3:56:51", "throughput": 1131.36, "total_tokens": 58307808}
{"current_steps": 1840, "total_steps": 2341, "loss": 0.7216, "learning_rate": 5.440773000197763e-06, "epoch": 0.7858210548793508, "percentage": 78.6, "elapsed_time": "14:21:12", "remaining_time": "3:54:29", "throughput": 1131.4, "total_tokens": 58462528}
{"current_steps": 1845, "total_steps": 2341, "loss": 0.5983, "learning_rate": 5.3367378390220184e-06, "epoch": 0.7879564381806534, "percentage": 78.81, "elapsed_time": "14:23:37", "remaining_time": "3:52:10", "throughput": 1131.41, "total_tokens": 58626784}
{"current_steps": 1850, "total_steps": 2341, "loss": 0.5874, "learning_rate": 5.233587978666754e-06, "epoch": 0.790091821481956, "percentage": 79.03, "elapsed_time": "14:26:15", "remaining_time": "3:49:54", "throughput": 1131.4, "total_tokens": 58805760}
{"current_steps": 1855, "total_steps": 2341, "loss": 0.6549, "learning_rate": 5.131328063257415e-06, "epoch": 0.7922272047832586, "percentage": 79.24, "elapsed_time": "14:28:54", "remaining_time": "3:47:39", "throughput": 1131.47, "total_tokens": 58989248}
{"current_steps": 1860, "total_steps": 2341, "loss": 0.7086, "learning_rate": 5.029962696851365e-06, "epoch": 0.7943625880845612, "percentage": 79.45, "elapsed_time": "14:30:58", "remaining_time": "3:45:14", "throughput": 1131.44, "total_tokens": 59127904}
{"current_steps": 1865, "total_steps": 2341, "loss": 0.6751, "learning_rate": 4.9294964432306105e-06, "epoch": 0.7964979713858638, "percentage": 79.67, "elapsed_time": "14:33:22", "remaining_time": "3:42:54", "throughput": 1131.44, "total_tokens": 59290880}
{"current_steps": 1870, "total_steps": 2341, "loss": 0.6631, "learning_rate": 4.829933825696328e-06, "epoch": 0.7986333546871663, "percentage": 79.88, "elapsed_time": "14:35:46", "remaining_time": "3:40:35", "throughput": 1131.44, "total_tokens": 59453504}
{"current_steps": 1875, "total_steps": 2341, "loss": 0.6248, "learning_rate": 4.731279326865193e-06, "epoch": 0.8007687379884689, "percentage": 80.09, "elapsed_time": "14:38:21", "remaining_time": "3:38:18", "throughput": 1131.45, "total_tokens": 59628704}
{"current_steps": 1880, "total_steps": 2341, "loss": 0.6742, "learning_rate": 4.633537388467582e-06, "epoch": 0.8029041212897715, "percentage": 80.31, "elapsed_time": "14:40:28", "remaining_time": "3:35:54", "throughput": 1131.41, "total_tokens": 59770720}
{"current_steps": 1885, "total_steps": 2341, "loss": 0.6084, "learning_rate": 4.536712411147573e-06, "epoch": 0.8050395045910741, "percentage": 80.52, "elapsed_time": "14:42:48", "remaining_time": "3:33:33", "throughput": 1131.41, "total_tokens": 59929280}
{"current_steps": 1890, "total_steps": 2341, "loss": 0.7314, "learning_rate": 4.4408087542648334e-06, "epoch": 0.8071748878923767, "percentage": 80.73, "elapsed_time": "14:44:36", "remaining_time": "3:31:05", "throughput": 1131.3, "total_tokens": 60045152}
{"current_steps": 1895, "total_steps": 2341, "loss": 0.6492, "learning_rate": 4.345830735698322e-06, "epoch": 0.8093102711936793, "percentage": 80.95, "elapsed_time": "14:46:24", "remaining_time": "3:28:37", "throughput": 1131.22, "total_tokens": 60163840}
{"current_steps": 1900, "total_steps": 2341, "loss": 0.7565, "learning_rate": 4.251782631651918e-06, "epoch": 0.8114456544949818, "percentage": 81.16, "elapsed_time": "14:48:48", "remaining_time": "3:26:17", "throughput": 1131.27, "total_tokens": 60329152}
{"current_steps": 1905, "total_steps": 2341, "loss": 0.6302, "learning_rate": 4.158668676461866e-06, "epoch": 0.8135810377962844, "percentage": 81.38, "elapsed_time": "14:50:40", "remaining_time": "3:23:50", "throughput": 1131.2, "total_tokens": 60451264}
{"current_steps": 1910, "total_steps": 2341, "loss": 0.6156, "learning_rate": 4.0664930624061375e-06, "epoch": 0.815716421097587, "percentage": 81.59, "elapsed_time": "14:52:57", "remaining_time": "3:21:29", "throughput": 1131.21, "total_tokens": 60607008}
{"current_steps": 1915, "total_steps": 2341, "loss": 0.6657, "learning_rate": 3.975259939515708e-06, "epoch": 0.8178518043988896, "percentage": 81.8, "elapsed_time": "14:55:15", "remaining_time": "3:19:09", "throughput": 1131.22, "total_tokens": 60764064}
{"current_steps": 1920, "total_steps": 2341, "loss": 0.834, "learning_rate": 3.884973415387652e-06, "epoch": 0.8199871877001922, "percentage": 82.02, "elapsed_time": "14:57:33", "remaining_time": "3:16:48", "throughput": 1131.21, "total_tokens": 60919072}
{"current_steps": 1925, "total_steps": 2341, "loss": 0.6426, "learning_rate": 3.79563755500027e-06, "epoch": 0.8221225710014948, "percentage": 82.23, "elapsed_time": "14:59:50", "remaining_time": "3:14:27", "throughput": 1131.22, "total_tokens": 61074976}
{"current_steps": 1930, "total_steps": 2341, "loss": 0.7106, "learning_rate": 3.7072563805300497e-06, "epoch": 0.8242579543027974, "percentage": 82.44, "elapsed_time": "15:01:49", "remaining_time": "3:12:02", "throughput": 1131.2, "total_tokens": 61209088}
{"current_steps": 1935, "total_steps": 2341, "loss": 0.724, "learning_rate": 3.61983387117055e-06, "epoch": 0.8263933376040999, "percentage": 82.66, "elapsed_time": "15:04:10", "remaining_time": "3:09:42", "throughput": 1131.19, "total_tokens": 61367360}
{"current_steps": 1940, "total_steps": 2341, "loss": 0.7054, "learning_rate": 3.533373962953271e-06, "epoch": 0.8285287209054025, "percentage": 82.87, "elapsed_time": "15:06:15", "remaining_time": "3:07:19", "throughput": 1131.16, "total_tokens": 61506976}
{"current_steps": 1945, "total_steps": 2341, "loss": 0.5991, "learning_rate": 3.447880548570434e-06, "epoch": 0.8306641042067051, "percentage": 83.08, "elapsed_time": "15:08:32", "remaining_time": "3:04:58", "throughput": 1131.13, "total_tokens": 61661280}
{"current_steps": 1950, "total_steps": 2341, "loss": 0.8037, "learning_rate": 3.3633574771997245e-06, "epoch": 0.8327994875080077, "percentage": 83.3, "elapsed_time": "15:10:48", "remaining_time": "3:02:37", "throughput": 1131.11, "total_tokens": 61813056}
{"current_steps": 1955, "total_steps": 2341, "loss": 0.7369, "learning_rate": 3.2798085543309847e-06, "epoch": 0.8349348708093103, "percentage": 83.51, "elapsed_time": "15:13:08", "remaining_time": "3:00:17", "throughput": 1131.09, "total_tokens": 61970752}
{"current_steps": 1960, "total_steps": 2341, "loss": 0.5092, "learning_rate": 3.1972375415948884e-06, "epoch": 0.8370702541106129, "percentage": 83.72, "elapsed_time": "15:14:56", "remaining_time": "2:57:51", "throughput": 1130.95, "total_tokens": 62085728}
{"current_steps": 1965, "total_steps": 2341, "loss": 0.5488, "learning_rate": 3.1156481565935563e-06, "epoch": 0.8392056374119155, "percentage": 83.94, "elapsed_time": "15:17:08", "remaining_time": "2:55:29", "throughput": 1130.9, "total_tokens": 62232288}
{"current_steps": 1970, "total_steps": 2341, "loss": 0.8189, "learning_rate": 3.035044072733209e-06, "epoch": 0.841341020713218, "percentage": 84.15, "elapsed_time": "15:19:49", "remaining_time": "2:53:13", "throughput": 1130.98, "total_tokens": 62418272}
{"current_steps": 1975, "total_steps": 2341, "loss": 0.7843, "learning_rate": 2.955428919058767e-06, "epoch": 0.8434764040145206, "percentage": 84.37, "elapsed_time": "15:21:55", "remaining_time": "2:50:50", "throughput": 1130.97, "total_tokens": 62560416}
{"current_steps": 1980, "total_steps": 2341, "loss": 0.6783, "learning_rate": 2.876806280090449e-06, "epoch": 0.8456117873158232, "percentage": 84.58, "elapsed_time": "15:24:12", "remaining_time": "2:48:30", "throughput": 1130.93, "total_tokens": 62713120}
{"current_steps": 1985, "total_steps": 2341, "loss": 0.6642, "learning_rate": 2.7991796956624017e-06, "epoch": 0.8477471706171258, "percentage": 84.79, "elapsed_time": "15:27:00", "remaining_time": "2:46:15", "throughput": 1130.99, "total_tokens": 62906304}
{"current_steps": 1990, "total_steps": 2341, "loss": 0.697, "learning_rate": 2.7225526607633167e-06, "epoch": 0.8498825539184284, "percentage": 85.01, "elapsed_time": "15:29:02", "remaining_time": "2:43:51", "throughput": 1130.98, "total_tokens": 63043552}
{"current_steps": 1995, "total_steps": 2341, "loss": 0.549, "learning_rate": 2.6469286253790777e-06, "epoch": 0.852017937219731, "percentage": 85.22, "elapsed_time": "15:31:15", "remaining_time": "2:41:30", "throughput": 1130.95, "total_tokens": 63192608}
{"current_steps": 2000, "total_steps": 2341, "loss": 0.8259, "learning_rate": 2.5723109943374264e-06, "epoch": 0.8541533205210335, "percentage": 85.43, "elapsed_time": "15:33:56", "remaining_time": "2:39:14", "throughput": 1131.03, "total_tokens": 63379296}
{"current_steps": 2005, "total_steps": 2341, "loss": 0.6236, "learning_rate": 2.4987031271546753e-06, "epoch": 0.8562887038223361, "percentage": 85.65, "elapsed_time": "15:36:23", "remaining_time": "2:36:55", "throughput": 1130.94, "total_tokens": 63540576}
{"current_steps": 2010, "total_steps": 2341, "loss": 0.6153, "learning_rate": 2.4261083378844557e-06, "epoch": 0.8584240871236387, "percentage": 85.86, "elapsed_time": "15:38:51", "remaining_time": "2:34:36", "throughput": 1131.0, "total_tokens": 63710688}
{"current_steps": 2015, "total_steps": 2341, "loss": 0.6785, "learning_rate": 2.354529894968485e-06, "epoch": 0.8605594704249413, "percentage": 86.07, "elapsed_time": "15:41:19", "remaining_time": "2:32:17", "throughput": 1131.03, "total_tokens": 63879584}
{"current_steps": 2020, "total_steps": 2341, "loss": 0.6377, "learning_rate": 2.2839710210894372e-06, "epoch": 0.8626948537262439, "percentage": 86.29, "elapsed_time": "15:43:22", "remaining_time": "2:29:54", "throughput": 1130.97, "total_tokens": 64015744}
{"current_steps": 2025, "total_steps": 2341, "loss": 0.4801, "learning_rate": 2.214434893025838e-06, "epoch": 0.8648302370275465, "percentage": 86.5, "elapsed_time": "15:45:52", "remaining_time": "2:27:36", "throughput": 1131.0, "total_tokens": 64187232}
{"current_steps": 2030, "total_steps": 2341, "loss": 0.7073, "learning_rate": 2.1459246415090312e-06, "epoch": 0.866965620328849, "percentage": 86.72, "elapsed_time": "15:48:00", "remaining_time": "2:25:14", "throughput": 1131.01, "total_tokens": 64331968}
{"current_steps": 2035, "total_steps": 2341, "loss": 0.7264, "learning_rate": 2.078443351082232e-06, "epoch": 0.8691010036301516, "percentage": 86.93, "elapsed_time": "15:50:13", "remaining_time": "2:22:53", "throughput": 1131.0, "total_tokens": 64482816}
{"current_steps": 2040, "total_steps": 2341, "loss": 0.7054, "learning_rate": 2.011994059961647e-06, "epoch": 0.8712363869314542, "percentage": 87.14, "elapsed_time": "15:52:26", "remaining_time": "2:20:31", "throughput": 1131.02, "total_tokens": 64634368}
{"current_steps": 2045, "total_steps": 2341, "loss": 0.7034, "learning_rate": 1.9465797598996914e-06, "epoch": 0.8733717702327568, "percentage": 87.36, "elapsed_time": "15:54:45", "remaining_time": "2:18:11", "throughput": 1130.96, "total_tokens": 64787424}
{"current_steps": 2050, "total_steps": 2341, "loss": 0.593, "learning_rate": 1.8822033960502722e-06, "epoch": 0.8755071535340594, "percentage": 87.57, "elapsed_time": "15:56:57", "remaining_time": "2:15:50", "throughput": 1130.93, "total_tokens": 64935616}
{"current_steps": 2055, "total_steps": 2341, "loss": 0.7639, "learning_rate": 1.8188678668362102e-06, "epoch": 0.877642536835362, "percentage": 87.78, "elapsed_time": "15:59:25", "remaining_time": "2:13:31", "throughput": 1130.95, "total_tokens": 65103392}
{"current_steps": 2060, "total_steps": 2341, "loss": 0.6378, "learning_rate": 1.7565760238187401e-06, "epoch": 0.8797779201366646, "percentage": 88.0, "elapsed_time": "16:01:24", "remaining_time": "2:11:08", "throughput": 1130.92, "total_tokens": 65236032}
{"current_steps": 2065, "total_steps": 2341, "loss": 0.572, "learning_rate": 1.6953306715690925e-06, "epoch": 0.8819133034379671, "percentage": 88.21, "elapsed_time": "16:03:27", "remaining_time": "2:08:46", "throughput": 1130.91, "total_tokens": 65374432}
{"current_steps": 2070, "total_steps": 2341, "loss": 0.6153, "learning_rate": 1.6351345675422874e-06, "epoch": 0.8840486867392697, "percentage": 88.42, "elapsed_time": "16:06:04", "remaining_time": "2:06:28", "throughput": 1130.94, "total_tokens": 65554048}
{"current_steps": 2075, "total_steps": 2341, "loss": 0.7024, "learning_rate": 1.5759904219529249e-06, "epoch": 0.8861840700405723, "percentage": 88.64, "elapsed_time": "16:08:30", "remaining_time": "2:04:09", "throughput": 1130.94, "total_tokens": 65719584}
{"current_steps": 2080, "total_steps": 2341, "loss": 0.6698, "learning_rate": 1.5179008976531878e-06, "epoch": 0.8883194533418749, "percentage": 88.85, "elapsed_time": "16:11:18", "remaining_time": "2:01:52", "throughput": 1130.98, "total_tokens": 65911616}
{"current_steps": 2085, "total_steps": 2341, "loss": 0.7602, "learning_rate": 1.4608686100129553e-06, "epoch": 0.8904548366431775, "percentage": 89.06, "elapsed_time": "16:13:46", "remaining_time": "1:59:33", "throughput": 1131.01, "total_tokens": 66080480}
{"current_steps": 2090, "total_steps": 2341, "loss": 0.5967, "learning_rate": 1.4048961268020384e-06, "epoch": 0.8925902199444801, "percentage": 89.28, "elapsed_time": "16:16:04", "remaining_time": "1:57:13", "throughput": 1131.02, "total_tokens": 66237376}
{"current_steps": 2095, "total_steps": 2341, "loss": 0.7729, "learning_rate": 1.3499859680745852e-06, "epoch": 0.8947256032457827, "percentage": 89.49, "elapsed_time": "16:18:29", "remaining_time": "1:54:53", "throughput": 1131.06, "total_tokens": 66404128}
{"current_steps": 2100, "total_steps": 2341, "loss": 0.7682, "learning_rate": 1.2961406060556097e-06, "epoch": 0.8968609865470852, "percentage": 89.71, "elapsed_time": "16:21:08", "remaining_time": "1:52:35", "throughput": 1131.13, "total_tokens": 66587872}
{"current_steps": 2105, "total_steps": 2341, "loss": 0.8945, "learning_rate": 1.2433624650296905e-06, "epoch": 0.8989963698483878, "percentage": 89.92, "elapsed_time": "16:22:58", "remaining_time": "1:50:12", "throughput": 1131.06, "total_tokens": 66708672}
{"current_steps": 2110, "total_steps": 2341, "loss": 0.5526, "learning_rate": 1.191653921231811e-06, "epoch": 0.9011317531496904, "percentage": 90.13, "elapsed_time": "16:25:13", "remaining_time": "1:47:51", "throughput": 1131.09, "total_tokens": 66862912}
{"current_steps": 2115, "total_steps": 2341, "loss": 0.6192, "learning_rate": 1.1410173027403882e-06, "epoch": 0.903267136450993, "percentage": 90.35, "elapsed_time": "16:26:59", "remaining_time": "1:45:27", "throughput": 1130.99, "total_tokens": 66976480}
{"current_steps": 2120, "total_steps": 2341, "loss": 0.6662, "learning_rate": 1.0914548893724563e-06, "epoch": 0.9054025197522956, "percentage": 90.56, "elapsed_time": "16:29:35", "remaining_time": "1:43:09", "throughput": 1131.04, "total_tokens": 67155712}
{"current_steps": 2125, "total_steps": 2341, "loss": 0.6332, "learning_rate": 1.042968912581005e-06, "epoch": 0.9075379030535982, "percentage": 90.77, "elapsed_time": "16:31:34", "remaining_time": "1:40:47", "throughput": 1131.0, "total_tokens": 67288000}
{"current_steps": 2130, "total_steps": 2341, "loss": 0.8033, "learning_rate": 9.955615553545295e-07, "epoch": 0.9096732863549007, "percentage": 90.99, "elapsed_time": "16:33:44", "remaining_time": "1:38:26", "throughput": 1131.03, "total_tokens": 67437632}
{"current_steps": 2135, "total_steps": 2341, "loss": 0.6562, "learning_rate": 9.492349521187355e-07, "epoch": 0.9118086696562033, "percentage": 91.2, "elapsed_time": "16:35:55", "remaining_time": "1:36:05", "throughput": 1131.02, "total_tokens": 67584288}
{"current_steps": 2140, "total_steps": 2341, "loss": 0.6629, "learning_rate": 9.039911886404462e-07, "epoch": 0.9139440529575059, "percentage": 91.41, "elapsed_time": "16:38:13", "remaining_time": "1:33:45", "throughput": 1131.02, "total_tokens": 67741024}
{"current_steps": 2145, "total_steps": 2341, "loss": 0.7827, "learning_rate": 8.59832301933694e-07, "epoch": 0.9160794362588085, "percentage": 91.63, "elapsed_time": "16:40:38", "remaining_time": "1:31:26", "throughput": 1131.03, "total_tokens": 67904928}
{"current_steps": 2150, "total_steps": 2341, "loss": 0.6068, "learning_rate": 8.16760280168008e-07, "epoch": 0.9182148195601111, "percentage": 91.84, "elapsed_time": "16:43:15", "remaining_time": "1:29:07", "throughput": 1131.05, "total_tokens": 68084128}
{"current_steps": 2155, "total_steps": 2341, "loss": 0.6923, "learning_rate": 7.747770625788964e-07, "epoch": 0.9203502028614137, "percentage": 92.05, "elapsed_time": "16:45:44", "remaining_time": "1:26:48", "throughput": 1131.05, "total_tokens": 68252704}
{"current_steps": 2160, "total_steps": 2341, "loss": 0.6895, "learning_rate": 7.338845393805388e-07, "epoch": 0.9224855861627163, "percentage": 92.27, "elapsed_time": "16:47:36", "remaining_time": "1:24:26", "throughput": 1130.99, "total_tokens": 68375360}
{"current_steps": 2165, "total_steps": 2341, "loss": 0.721, "learning_rate": 6.940845516806849e-07, "epoch": 0.9246209694640188, "percentage": 92.48, "elapsed_time": "16:50:02", "remaining_time": "1:22:06", "throughput": 1131.01, "total_tokens": 68542272}
{"current_steps": 2170, "total_steps": 2341, "loss": 0.7807, "learning_rate": 6.553788913977593e-07, "epoch": 0.9267563527653214, "percentage": 92.7, "elapsed_time": "16:52:26", "remaining_time": "1:19:46", "throughput": 1130.99, "total_tokens": 68703584}
{"current_steps": 2175, "total_steps": 2341, "loss": 0.6796, "learning_rate": 6.177693011801877e-07, "epoch": 0.928891736066624, "percentage": 92.91, "elapsed_time": "16:54:33", "remaining_time": "1:17:26", "throughput": 1130.96, "total_tokens": 68845760}
{"current_steps": 2180, "total_steps": 2341, "loss": 0.6509, "learning_rate": 5.812574743279286e-07, "epoch": 0.9310271193679266, "percentage": 93.12, "elapsed_time": "16:57:14", "remaining_time": "1:15:07", "throughput": 1131.01, "total_tokens": 69031072}
{"current_steps": 2185, "total_steps": 2341, "loss": 0.7432, "learning_rate": 5.458450547162486e-07, "epoch": 0.9331625026692292, "percentage": 93.34, "elapsed_time": "16:59:47", "remaining_time": "1:12:48", "throughput": 1131.07, "total_tokens": 69207200}
{"current_steps": 2190, "total_steps": 2341, "loss": 0.6785, "learning_rate": 5.115336367217005e-07, "epoch": 0.9352978859705318, "percentage": 93.55, "elapsed_time": "17:02:15", "remaining_time": "1:10:29", "throughput": 1131.07, "total_tokens": 69374944}
{"current_steps": 2195, "total_steps": 2341, "loss": 0.561, "learning_rate": 4.783247651503398e-07, "epoch": 0.9374332692718343, "percentage": 93.76, "elapsed_time": "17:04:31", "remaining_time": "1:08:08", "throughput": 1131.05, "total_tokens": 69527520}
{"current_steps": 2200, "total_steps": 2341, "loss": 0.6363, "learning_rate": 4.4621993516818227e-07, "epoch": 0.9395686525731369, "percentage": 93.98, "elapsed_time": "17:06:53", "remaining_time": "1:05:48", "throughput": 1131.05, "total_tokens": 69688256}
{"current_steps": 2205, "total_steps": 2341, "loss": 0.6927, "learning_rate": 4.152205922338698e-07, "epoch": 0.9417040358744395, "percentage": 94.19, "elapsed_time": "17:09:17", "remaining_time": "1:03:29", "throughput": 1131.06, "total_tokens": 69851776}
{"current_steps": 2210, "total_steps": 2341, "loss": 0.6462, "learning_rate": 3.8532813203360775e-07, "epoch": 0.9438394191757421, "percentage": 94.4, "elapsed_time": "17:11:44", "remaining_time": "1:01:09", "throughput": 1131.05, "total_tokens": 70017856}
{"current_steps": 2215, "total_steps": 2341, "loss": 0.6962, "learning_rate": 3.565439004183241e-07, "epoch": 0.9459748024770446, "percentage": 94.62, "elapsed_time": "17:13:44", "remaining_time": "0:58:48", "throughput": 1131.06, "total_tokens": 70153888}
{"current_steps": 2220, "total_steps": 2341, "loss": 0.6935, "learning_rate": 3.288691933430621e-07, "epoch": 0.9481101857783472, "percentage": 94.83, "elapsed_time": "17:15:48", "remaining_time": "0:56:27", "throughput": 1131.05, "total_tokens": 70292832}
{"current_steps": 2225, "total_steps": 2341, "loss": 0.6684, "learning_rate": 3.023052568086493e-07, "epoch": 0.9502455690796497, "percentage": 95.04, "elapsed_time": "17:18:05", "remaining_time": "0:54:07", "throughput": 1131.05, "total_tokens": 70448448}
{"current_steps": 2230, "total_steps": 2341, "loss": 0.7058, "learning_rate": 2.768532868055923e-07, "epoch": 0.9523809523809523, "percentage": 95.26, "elapsed_time": "17:20:15", "remaining_time": "0:51:46", "throughput": 1131.05, "total_tokens": 70595488}
{"current_steps": 2235, "total_steps": 2341, "loss": 0.6543, "learning_rate": 2.5251442926021715e-07, "epoch": 0.9545163356822549, "percentage": 95.47, "elapsed_time": "17:22:36", "remaining_time": "0:49:26", "throughput": 1131.08, "total_tokens": 70756416}
{"current_steps": 2240, "total_steps": 2341, "loss": 0.727, "learning_rate": 2.292897799831051e-07, "epoch": 0.9566517189835575, "percentage": 95.69, "elapsed_time": "17:25:18", "remaining_time": "0:47:07", "throughput": 1131.17, "total_tokens": 70944896}
{"current_steps": 2245, "total_steps": 2341, "loss": 0.6602, "learning_rate": 2.0718038461972345e-07, "epoch": 0.9587871022848601, "percentage": 95.9, "elapsed_time": "17:27:21", "remaining_time": "0:44:47", "throughput": 1131.16, "total_tokens": 71083616}
{"current_steps": 2250, "total_steps": 2341, "loss": 0.6301, "learning_rate": 1.8618723860336916e-07, "epoch": 0.9609224855861627, "percentage": 96.11, "elapsed_time": "17:29:39", "remaining_time": "0:42:27", "throughput": 1131.17, "total_tokens": 71240480}
{"current_steps": 2255, "total_steps": 2341, "loss": 0.6893, "learning_rate": 1.663112871103406e-07, "epoch": 0.9630578688874653, "percentage": 96.33, "elapsed_time": "17:32:21", "remaining_time": "0:40:08", "throughput": 1131.23, "total_tokens": 71427648}
{"current_steps": 2260, "total_steps": 2341, "loss": 0.6536, "learning_rate": 1.4755342501739377e-07, "epoch": 0.9651932521887678, "percentage": 96.54, "elapsed_time": "17:34:46", "remaining_time": "0:37:48", "throughput": 1131.23, "total_tokens": 71591648}
{"current_steps": 2265, "total_steps": 2341, "loss": 0.7046, "learning_rate": 1.2991449686143852e-07, "epoch": 0.9673286354900704, "percentage": 96.75, "elapsed_time": "17:36:52", "remaining_time": "0:35:27", "throughput": 1131.24, "total_tokens": 71735296}
{"current_steps": 2270, "total_steps": 2341, "loss": 0.559, "learning_rate": 1.1339529680152173e-07, "epoch": 0.969464018791373, "percentage": 96.97, "elapsed_time": "17:38:49", "remaining_time": "0:33:07", "throughput": 1131.16, "total_tokens": 71861920}
{"current_steps": 2275, "total_steps": 2341, "loss": 0.7401, "learning_rate": 9.799656858307527e-08, "epoch": 0.9715994020926756, "percentage": 97.18, "elapsed_time": "17:41:16", "remaining_time": "0:30:47", "throughput": 1131.18, "total_tokens": 72029568}
{"current_steps": 2280, "total_steps": 2341, "loss": 0.5554, "learning_rate": 8.37190055044207e-08, "epoch": 0.9737347853939782, "percentage": 97.39, "elapsed_time": "17:43:19", "remaining_time": "0:28:26", "throughput": 1131.14, "total_tokens": 72166464}
{"current_steps": 2285, "total_steps": 2341, "loss": 0.6366, "learning_rate": 7.056325038556911e-08, "epoch": 0.9758701686952808, "percentage": 97.61, "elapsed_time": "17:45:42", "remaining_time": "0:26:07", "throughput": 1131.12, "total_tokens": 72326496}
{"current_steps": 2290, "total_steps": 2341, "loss": 0.5862, "learning_rate": 5.8529895539266575e-08, "epoch": 0.9780055519965833, "percentage": 97.82, "elapsed_time": "17:47:29", "remaining_time": "0:23:46", "throughput": 1131.06, "total_tokens": 72443616}
{"current_steps": 2295, "total_steps": 2341, "loss": 0.7018, "learning_rate": 4.7619482744326595e-08, "epoch": 0.9801409352978859, "percentage": 98.04, "elapsed_time": "17:50:05", "remaining_time": "0:21:26", "throughput": 1131.12, "total_tokens": 72624032}
{"current_steps": 2300, "total_steps": 2341, "loss": 0.642, "learning_rate": 3.7832503221249535e-08, "epoch": 0.9822763185991885, "percentage": 98.25, "elapsed_time": "17:52:37", "remaining_time": "0:19:07", "throughput": 1131.14, "total_tokens": 72797184}
{"current_steps": 2305, "total_steps": 2341, "loss": 0.6432, "learning_rate": 2.916939761009041e-08, "epoch": 0.9844117019004911, "percentage": 98.46, "elapsed_time": "17:54:45", "remaining_time": "0:16:47", "throughput": 1131.12, "total_tokens": 72941600}
{"current_steps": 2310, "total_steps": 2341, "loss": 0.5893, "learning_rate": 2.1630555950635788e-08, "epoch": 0.9865470852017937, "percentage": 98.68, "elapsed_time": "17:57:18", "remaining_time": "0:14:27", "throughput": 1131.16, "total_tokens": 73116000}
{"current_steps": 2315, "total_steps": 2341, "loss": 0.6636, "learning_rate": 1.5216317664829004e-08, "epoch": 0.9886824685030963, "percentage": 98.89, "elapsed_time": "17:59:48", "remaining_time": "0:12:07", "throughput": 1131.15, "total_tokens": 73285504}
{"current_steps": 2320, "total_steps": 2341, "loss": 0.7166, "learning_rate": 9.926971541496244e-09, "epoch": 0.9908178518043989, "percentage": 99.1, "elapsed_time": "18:02:05", "remaining_time": "0:09:47", "throughput": 1131.15, "total_tokens": 73440544}
{"current_steps": 2325, "total_steps": 2341, "loss": 0.4921, "learning_rate": 5.762755723348612e-09, "epoch": 0.9929532351057014, "percentage": 99.32, "elapsed_time": "18:03:45", "remaining_time": "0:07:27", "throughput": 1131.08, "total_tokens": 73549760}
{"current_steps": 2330, "total_steps": 2341, "loss": 0.6256, "learning_rate": 2.7238576962435034e-09, "epoch": 0.995088618407004, "percentage": 99.53, "elapsed_time": "18:06:05", "remaining_time": "0:05:07", "throughput": 1131.11, "total_tokens": 73709952}
{"current_steps": 2335, "total_steps": 2341, "loss": 0.7422, "learning_rate": 8.104142807663361e-10, "epoch": 0.9972240017083066, "percentage": 99.74, "elapsed_time": "18:08:57", "remaining_time": "0:02:47", "throughput": 1131.17, "total_tokens": 73907360}
{"current_steps": 2340, "total_steps": 2341, "loss": 0.656, "learning_rate": 2.2511626046606283e-11, "epoch": 0.9993593850096092, "percentage": 99.96, "elapsed_time": "18:11:06", "remaining_time": "0:00:27", "throughput": 1131.16, "total_tokens": 74053280}
{"current_steps": 2341, "total_steps": 2341, "epoch": 0.9997864616698697, "percentage": 100.0, "elapsed_time": "18:11:36", "remaining_time": "0:00:00", "throughput": 1131.1, "total_tokens": 74083488}
|