SKNahin commited on
Commit
2371621
·
verified ·
1 Parent(s): b5ec463

Training in progress, step 3633

Browse files
Files changed (2) hide show
  1. model.safetensors +1 -1
  2. trainer_log.jsonl +125 -0
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2894bb00dd3902d4bca48e0a35496370a362f1a99b43277add0d546dddd8a04
3
  size 2471645608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a583064ae2fd08cb658e768d06456151ccdb9eaa4e0ab83b2313803804f0a4db
3
  size 2471645608
trainer_log.jsonl CHANGED
@@ -3507,3 +3507,128 @@
3507
  {"current_steps": 3507, "total_steps": 3633, "loss": 0.7718, "learning_rate": 1.2104946934673235e-07, "epoch": 0.9652514965939586, "percentage": 96.53, "elapsed_time": "9:47:58", "remaining_time": "0:21:07"}
3508
  {"current_steps": 3508, "total_steps": 3633, "loss": 0.7533, "learning_rate": 1.1913757620852562e-07, "epoch": 0.9655267322645015, "percentage": 96.56, "elapsed_time": "9:48:08", "remaining_time": "0:20:57"}
3509
  {"current_steps": 3509, "total_steps": 3633, "loss": 0.7843, "learning_rate": 1.1724085691280806e-07, "epoch": 0.9658019679350444, "percentage": 96.59, "elapsed_time": "9:48:18", "remaining_time": "0:20:47"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3507
  {"current_steps": 3507, "total_steps": 3633, "loss": 0.7718, "learning_rate": 1.2104946934673235e-07, "epoch": 0.9652514965939586, "percentage": 96.53, "elapsed_time": "9:47:58", "remaining_time": "0:21:07"}
3508
  {"current_steps": 3508, "total_steps": 3633, "loss": 0.7533, "learning_rate": 1.1913757620852562e-07, "epoch": 0.9655267322645015, "percentage": 96.56, "elapsed_time": "9:48:08", "remaining_time": "0:20:57"}
3509
  {"current_steps": 3509, "total_steps": 3633, "loss": 0.7843, "learning_rate": 1.1724085691280806e-07, "epoch": 0.9658019679350444, "percentage": 96.59, "elapsed_time": "9:48:18", "remaining_time": "0:20:47"}
3510
+ {"current_steps": 3510, "total_steps": 3633, "loss": 0.7836, "learning_rate": 1.1535931290723057e-07, "epoch": 0.9660772036055872, "percentage": 96.61, "elapsed_time": "9:48:28", "remaining_time": "0:20:37"}
3511
+ {"current_steps": 3511, "total_steps": 3633, "loss": 0.7488, "learning_rate": 1.1349294562786217e-07, "epoch": 0.9663524392761302, "percentage": 96.64, "elapsed_time": "9:48:38", "remaining_time": "0:20:27"}
3512
+ {"current_steps": 3512, "total_steps": 3633, "loss": 0.7714, "learning_rate": 1.1164175649918341e-07, "epoch": 0.9666276749466731, "percentage": 96.67, "elapsed_time": "9:48:48", "remaining_time": "0:20:17"}
3513
+ {"current_steps": 3513, "total_steps": 3633, "loss": 0.7283, "learning_rate": 1.0980574693409295e-07, "epoch": 0.966902910617216, "percentage": 96.7, "elapsed_time": "9:48:58", "remaining_time": "0:20:07"}
3514
+ {"current_steps": 3514, "total_steps": 3633, "loss": 0.7777, "learning_rate": 1.0798491833390767e-07, "epoch": 0.9671781462877589, "percentage": 96.72, "elapsed_time": "9:49:08", "remaining_time": "0:19:57"}
3515
+ {"current_steps": 3515, "total_steps": 3633, "loss": 0.7573, "learning_rate": 1.0617927208835143e-07, "epoch": 0.9674533819583018, "percentage": 96.75, "elapsed_time": "9:49:18", "remaining_time": "0:19:47"}
3516
+ {"current_steps": 3516, "total_steps": 3633, "loss": 0.7675, "learning_rate": 1.0438880957556408e-07, "epoch": 0.9677286176288447, "percentage": 96.78, "elapsed_time": "9:49:28", "remaining_time": "0:19:36"}
3517
+ {"current_steps": 3517, "total_steps": 3633, "loss": 0.7666, "learning_rate": 1.0261353216209691e-07, "epoch": 0.9680038532993877, "percentage": 96.81, "elapsed_time": "9:49:38", "remaining_time": "0:19:26"}
3518
+ {"current_steps": 3518, "total_steps": 3633, "loss": 0.8104, "learning_rate": 1.008534412029083e-07, "epoch": 0.9682790889699305, "percentage": 96.83, "elapsed_time": "9:49:48", "remaining_time": "0:19:16"}
3519
+ {"current_steps": 3519, "total_steps": 3633, "loss": 0.7596, "learning_rate": 9.910853804137033e-08, "epoch": 0.9685543246404734, "percentage": 96.86, "elapsed_time": "9:49:58", "remaining_time": "0:19:06"}
3520
+ {"current_steps": 3520, "total_steps": 3633, "loss": 0.7746, "learning_rate": 9.737882400925768e-08, "epoch": 0.9688295603110163, "percentage": 96.89, "elapsed_time": "9:50:08", "remaining_time": "0:18:56"}
3521
+ {"current_steps": 3521, "total_steps": 3633, "loss": 0.741, "learning_rate": 9.566430042675657e-08, "epoch": 0.9691047959815592, "percentage": 96.92, "elapsed_time": "9:50:18", "remaining_time": "0:18:46"}
3522
+ {"current_steps": 3522, "total_steps": 3633, "loss": 0.7662, "learning_rate": 9.396496860245797e-08, "epoch": 0.9693800316521021, "percentage": 96.94, "elapsed_time": "9:50:28", "remaining_time": "0:18:36"}
3523
+ {"current_steps": 3523, "total_steps": 3633, "loss": 0.7685, "learning_rate": 9.228082983335329e-08, "epoch": 0.9696552673226451, "percentage": 96.97, "elapsed_time": "9:50:38", "remaining_time": "0:18:26"}
3524
+ {"current_steps": 3524, "total_steps": 3633, "loss": 0.7515, "learning_rate": 9.061188540484989e-08, "epoch": 0.969930502993188, "percentage": 97.0, "elapsed_time": "9:50:48", "remaining_time": "0:18:16"}
3525
+ {"current_steps": 3525, "total_steps": 3633, "loss": 0.8175, "learning_rate": 8.895813659074437e-08, "epoch": 0.9702057386637308, "percentage": 97.03, "elapsed_time": "9:50:59", "remaining_time": "0:18:06"}
3526
+ {"current_steps": 3526, "total_steps": 3633, "loss": 0.755, "learning_rate": 8.731958465324486e-08, "epoch": 0.9704809743342737, "percentage": 97.05, "elapsed_time": "9:51:09", "remaining_time": "0:17:56"}
3527
+ {"current_steps": 3527, "total_steps": 3633, "loss": 0.7545, "learning_rate": 8.569623084295541e-08, "epoch": 0.9707562100048166, "percentage": 97.08, "elapsed_time": "9:51:19", "remaining_time": "0:17:46"}
3528
+ {"current_steps": 3528, "total_steps": 3633, "loss": 0.7656, "learning_rate": 8.408807639888494e-08, "epoch": 0.9710314456753595, "percentage": 97.11, "elapsed_time": "9:51:29", "remaining_time": "0:17:36"}
3529
+ {"current_steps": 3529, "total_steps": 3633, "loss": 0.7861, "learning_rate": 8.249512254843827e-08, "epoch": 0.9713066813459025, "percentage": 97.14, "elapsed_time": "9:51:39", "remaining_time": "0:17:26"}
3530
+ {"current_steps": 3530, "total_steps": 3633, "loss": 0.7782, "learning_rate": 8.091737050741621e-08, "epoch": 0.9715819170164454, "percentage": 97.16, "elapsed_time": "9:51:49", "remaining_time": "0:17:16"}
3531
+ {"current_steps": 3531, "total_steps": 3633, "loss": 0.7597, "learning_rate": 7.93548214800266e-08, "epoch": 0.9718571526869882, "percentage": 97.19, "elapsed_time": "9:51:58", "remaining_time": "0:17:06"}
3532
+ {"current_steps": 3532, "total_steps": 3633, "loss": 0.7466, "learning_rate": 7.78074766588599e-08, "epoch": 0.9721323883575311, "percentage": 97.22, "elapsed_time": "9:52:09", "remaining_time": "0:16:55"}
3533
+ {"current_steps": 3533, "total_steps": 3633, "loss": 0.7701, "learning_rate": 7.627533722491364e-08, "epoch": 0.972407624028074, "percentage": 97.25, "elapsed_time": "9:52:19", "remaining_time": "0:16:45"}
3534
+ {"current_steps": 3534, "total_steps": 3633, "loss": 0.7604, "learning_rate": 7.475840434757686e-08, "epoch": 0.9726828596986169, "percentage": 97.27, "elapsed_time": "9:52:29", "remaining_time": "0:16:35"}
3535
+ {"current_steps": 3535, "total_steps": 3633, "loss": 0.7608, "learning_rate": 7.325667918462787e-08, "epoch": 0.9729580953691599, "percentage": 97.3, "elapsed_time": "9:52:39", "remaining_time": "0:16:25"}
3536
+ {"current_steps": 3536, "total_steps": 3633, "loss": 0.7865, "learning_rate": 7.177016288224315e-08, "epoch": 0.9732333310397028, "percentage": 97.33, "elapsed_time": "9:52:49", "remaining_time": "0:16:15"}
3537
+ {"current_steps": 3537, "total_steps": 3633, "loss": 0.7647, "learning_rate": 7.02988565749907e-08, "epoch": 0.9735085667102457, "percentage": 97.36, "elapsed_time": "9:52:59", "remaining_time": "0:16:05"}
3538
+ {"current_steps": 3538, "total_steps": 3633, "loss": 0.8035, "learning_rate": 6.884276138582557e-08, "epoch": 0.9737838023807885, "percentage": 97.39, "elapsed_time": "9:53:09", "remaining_time": "0:15:55"}
3539
+ {"current_steps": 3539, "total_steps": 3633, "loss": 0.77, "learning_rate": 6.74018784260988e-08, "epoch": 0.9740590380513314, "percentage": 97.41, "elapsed_time": "9:53:19", "remaining_time": "0:15:45"}
3540
+ {"current_steps": 3540, "total_steps": 3633, "loss": 0.787, "learning_rate": 6.597620879554623e-08, "epoch": 0.9743342737218743, "percentage": 97.44, "elapsed_time": "9:53:29", "remaining_time": "0:15:35"}
3541
+ {"current_steps": 3541, "total_steps": 3633, "loss": 0.7558, "learning_rate": 6.4565753582293e-08, "epoch": 0.9746095093924173, "percentage": 97.47, "elapsed_time": "9:53:39", "remaining_time": "0:15:25"}
3542
+ {"current_steps": 3542, "total_steps": 3633, "loss": 0.7744, "learning_rate": 6.317051386285356e-08, "epoch": 0.9748847450629602, "percentage": 97.5, "elapsed_time": "9:53:49", "remaining_time": "0:15:15"}
3543
+ {"current_steps": 3543, "total_steps": 3633, "loss": 0.7987, "learning_rate": 6.179049070213161e-08, "epoch": 0.9751599807335031, "percentage": 97.52, "elapsed_time": "9:53:59", "remaining_time": "0:15:05"}
3544
+ {"current_steps": 3544, "total_steps": 3633, "loss": 0.766, "learning_rate": 6.04256851534113e-08, "epoch": 0.975435216404046, "percentage": 97.55, "elapsed_time": "9:54:09", "remaining_time": "0:14:55"}
3545
+ {"current_steps": 3545, "total_steps": 3633, "loss": 0.7655, "learning_rate": 5.90760982583638e-08, "epoch": 0.9757104520745888, "percentage": 97.58, "elapsed_time": "9:54:19", "remaining_time": "0:14:45"}
3546
+ {"current_steps": 3546, "total_steps": 3633, "loss": 0.7916, "learning_rate": 5.774173104705183e-08, "epoch": 0.9759856877451317, "percentage": 97.61, "elapsed_time": "9:54:29", "remaining_time": "0:14:35"}
3547
+ {"current_steps": 3547, "total_steps": 3633, "loss": 0.7453, "learning_rate": 5.642258453790961e-08, "epoch": 0.9762609234156747, "percentage": 97.63, "elapsed_time": "9:54:39", "remaining_time": "0:14:25"}
3548
+ {"current_steps": 3548, "total_steps": 3633, "loss": 0.7406, "learning_rate": 5.511865973776287e-08, "epoch": 0.9765361590862176, "percentage": 97.66, "elapsed_time": "9:54:49", "remaining_time": "0:14:15"}
3549
+ {"current_steps": 3549, "total_steps": 3633, "loss": 0.7565, "learning_rate": 5.382995764181775e-08, "epoch": 0.9768113947567605, "percentage": 97.69, "elapsed_time": "9:54:59", "remaining_time": "0:14:04"}
3550
+ {"current_steps": 3550, "total_steps": 3633, "loss": 0.7611, "learning_rate": 5.2556479233663026e-08, "epoch": 0.9770866304273034, "percentage": 97.72, "elapsed_time": "9:55:09", "remaining_time": "0:13:54"}
3551
+ {"current_steps": 3551, "total_steps": 3633, "loss": 0.7545, "learning_rate": 5.129822548526342e-08, "epoch": 0.9773618660978463, "percentage": 97.74, "elapsed_time": "9:55:20", "remaining_time": "0:13:44"}
3552
+ {"current_steps": 3552, "total_steps": 3633, "loss": 0.7479, "learning_rate": 5.005519735696851e-08, "epoch": 0.9776371017683891, "percentage": 97.77, "elapsed_time": "9:55:30", "remaining_time": "0:13:34"}
3553
+ {"current_steps": 3553, "total_steps": 3633, "loss": 0.7672, "learning_rate": 4.882739579750606e-08, "epoch": 0.9779123374389321, "percentage": 97.8, "elapsed_time": "9:55:40", "remaining_time": "0:13:24"}
3554
+ {"current_steps": 3554, "total_steps": 3633, "loss": 0.7813, "learning_rate": 4.761482174398202e-08, "epoch": 0.978187573109475, "percentage": 97.83, "elapsed_time": "9:55:50", "remaining_time": "0:13:14"}
3555
+ {"current_steps": 3555, "total_steps": 3633, "loss": 0.7656, "learning_rate": 4.641747612187608e-08, "epoch": 0.9784628087800179, "percentage": 97.85, "elapsed_time": "9:56:00", "remaining_time": "0:13:04"}
3556
+ {"current_steps": 3556, "total_steps": 3633, "loss": 0.7694, "learning_rate": 4.523535984505278e-08, "epoch": 0.9787380444505608, "percentage": 97.88, "elapsed_time": "9:56:10", "remaining_time": "0:12:54"}
3557
+ {"current_steps": 3557, "total_steps": 3633, "loss": 0.7762, "learning_rate": 4.406847381574819e-08, "epoch": 0.9790132801211037, "percentage": 97.91, "elapsed_time": "9:56:20", "remaining_time": "0:12:44"}
3558
+ {"current_steps": 3558, "total_steps": 3633, "loss": 0.7646, "learning_rate": 4.291681892457211e-08, "epoch": 0.9792885157916466, "percentage": 97.94, "elapsed_time": "9:56:30", "remaining_time": "0:12:34"}
3559
+ {"current_steps": 3559, "total_steps": 3633, "loss": 0.7883, "learning_rate": 4.178039605051698e-08, "epoch": 0.9795637514621895, "percentage": 97.96, "elapsed_time": "9:56:40", "remaining_time": "0:12:24"}
3560
+ {"current_steps": 3560, "total_steps": 3633, "loss": 0.7636, "learning_rate": 4.065920606093787e-08, "epoch": 0.9798389871327324, "percentage": 97.99, "elapsed_time": "9:56:50", "remaining_time": "0:12:14"}
3561
+ {"current_steps": 3561, "total_steps": 3633, "loss": 0.7775, "learning_rate": 3.9553249811576936e-08, "epoch": 0.9801142228032753, "percentage": 98.02, "elapsed_time": "9:57:00", "remaining_time": "0:12:04"}
3562
+ {"current_steps": 3562, "total_steps": 3633, "loss": 0.7571, "learning_rate": 3.846252814654117e-08, "epoch": 0.9803894584738182, "percentage": 98.05, "elapsed_time": "9:57:10", "remaining_time": "0:11:54"}
3563
+ {"current_steps": 3563, "total_steps": 3633, "loss": 0.7679, "learning_rate": 3.738704189830689e-08, "epoch": 0.9806646941443611, "percentage": 98.07, "elapsed_time": "9:57:20", "remaining_time": "0:11:44"}
3564
+ {"current_steps": 3564, "total_steps": 3633, "loss": 0.7684, "learning_rate": 3.632679188773303e-08, "epoch": 0.980939929814904, "percentage": 98.1, "elapsed_time": "9:57:30", "remaining_time": "0:11:34"}
3565
+ {"current_steps": 3565, "total_steps": 3633, "loss": 0.8016, "learning_rate": 3.528177892403894e-08, "epoch": 0.981215165485447, "percentage": 98.13, "elapsed_time": "9:57:40", "remaining_time": "0:11:24"}
3566
+ {"current_steps": 3566, "total_steps": 3633, "loss": 0.7641, "learning_rate": 3.425200380481997e-08, "epoch": 0.9814904011559898, "percentage": 98.16, "elapsed_time": "9:57:50", "remaining_time": "0:11:13"}
3567
+ {"current_steps": 3567, "total_steps": 3633, "loss": 0.7578, "learning_rate": 3.3237467316042937e-08, "epoch": 0.9817656368265327, "percentage": 98.18, "elapsed_time": "9:58:00", "remaining_time": "0:11:03"}
3568
+ {"current_steps": 3568, "total_steps": 3633, "loss": 0.7832, "learning_rate": 3.2238170232037346e-08, "epoch": 0.9820408724970756, "percentage": 98.21, "elapsed_time": "9:58:10", "remaining_time": "0:10:53"}
3569
+ {"current_steps": 3569, "total_steps": 3633, "loss": 0.7526, "learning_rate": 3.125411331550643e-08, "epoch": 0.9823161081676185, "percentage": 98.24, "elapsed_time": "9:58:20", "remaining_time": "0:10:43"}
3570
+ {"current_steps": 3570, "total_steps": 3633, "loss": 0.754, "learning_rate": 3.028529731752272e-08, "epoch": 0.9825913438381614, "percentage": 98.27, "elapsed_time": "9:58:30", "remaining_time": "0:10:33"}
3571
+ {"current_steps": 3571, "total_steps": 3633, "loss": 0.7554, "learning_rate": 2.9331722977523625e-08, "epoch": 0.9828665795087044, "percentage": 98.29, "elapsed_time": "9:58:41", "remaining_time": "0:10:23"}
3572
+ {"current_steps": 3572, "total_steps": 3633, "loss": 0.759, "learning_rate": 2.83933910233114e-08, "epoch": 0.9831418151792473, "percentage": 98.32, "elapsed_time": "9:58:51", "remaining_time": "0:10:13"}
3573
+ {"current_steps": 3573, "total_steps": 3633, "loss": 0.7384, "learning_rate": 2.7470302171057616e-08, "epoch": 0.9834170508497901, "percentage": 98.35, "elapsed_time": "9:59:01", "remaining_time": "0:10:03"}
3574
+ {"current_steps": 3574, "total_steps": 3633, "loss": 0.7616, "learning_rate": 2.6562457125300922e-08, "epoch": 0.983692286520333, "percentage": 98.38, "elapsed_time": "9:59:11", "remaining_time": "0:09:53"}
3575
+ {"current_steps": 3575, "total_steps": 3633, "loss": 0.7653, "learning_rate": 2.566985657894483e-08, "epoch": 0.9839675221908759, "percentage": 98.4, "elapsed_time": "9:59:21", "remaining_time": "0:09:43"}
3576
+ {"current_steps": 3576, "total_steps": 3633, "loss": 0.7548, "learning_rate": 2.4792501213253272e-08, "epoch": 0.9842427578614188, "percentage": 98.43, "elapsed_time": "9:59:31", "remaining_time": "0:09:33"}
3577
+ {"current_steps": 3577, "total_steps": 3633, "loss": 0.7847, "learning_rate": 2.393039169785949e-08, "epoch": 0.9845179935319618, "percentage": 98.46, "elapsed_time": "9:59:41", "remaining_time": "0:09:23"}
3578
+ {"current_steps": 3578, "total_steps": 3633, "loss": 0.7577, "learning_rate": 2.308352869075936e-08, "epoch": 0.9847932292025047, "percentage": 98.49, "elapsed_time": "9:59:51", "remaining_time": "0:09:13"}
3579
+ {"current_steps": 3579, "total_steps": 3633, "loss": 0.7698, "learning_rate": 2.2251912838311408e-08, "epoch": 0.9850684648730476, "percentage": 98.51, "elapsed_time": "10:00:01", "remaining_time": "0:09:03"}
3580
+ {"current_steps": 3580, "total_steps": 3633, "loss": 0.772, "learning_rate": 2.1435544775234574e-08, "epoch": 0.9853437005435904, "percentage": 98.54, "elapsed_time": "10:00:11", "remaining_time": "0:08:53"}
3581
+ {"current_steps": 3581, "total_steps": 3633, "loss": 0.7903, "learning_rate": 2.0634425124614886e-08, "epoch": 0.9856189362141333, "percentage": 98.57, "elapsed_time": "10:00:21", "remaining_time": "0:08:43"}
3582
+ {"current_steps": 3582, "total_steps": 3633, "loss": 0.7519, "learning_rate": 1.98485544978988e-08, "epoch": 0.9858941718846762, "percentage": 98.6, "elapsed_time": "10:00:31", "remaining_time": "0:08:33"}
3583
+ {"current_steps": 3583, "total_steps": 3633, "loss": 0.7709, "learning_rate": 1.9077933494888733e-08, "epoch": 0.9861694075552192, "percentage": 98.62, "elapsed_time": "10:00:41", "remaining_time": "0:08:22"}
3584
+ {"current_steps": 3584, "total_steps": 3633, "loss": 0.7524, "learning_rate": 1.8322562703758652e-08, "epoch": 0.9864446432257621, "percentage": 98.65, "elapsed_time": "10:00:51", "remaining_time": "0:08:12"}
3585
+ {"current_steps": 3585, "total_steps": 3633, "loss": 0.7555, "learning_rate": 1.758244270103182e-08, "epoch": 0.986719878896305, "percentage": 98.68, "elapsed_time": "10:01:01", "remaining_time": "0:08:02"}
3586
+ {"current_steps": 3586, "total_steps": 3633, "loss": 0.7536, "learning_rate": 1.68575740515986e-08, "epoch": 0.9869951145668479, "percentage": 98.71, "elapsed_time": "10:01:11", "remaining_time": "0:07:52"}
3587
+ {"current_steps": 3587, "total_steps": 3633, "loss": 0.7884, "learning_rate": 1.614795730870311e-08, "epoch": 0.9872703502373907, "percentage": 98.73, "elapsed_time": "10:01:22", "remaining_time": "0:07:42"}
3588
+ {"current_steps": 3588, "total_steps": 3633, "loss": 0.7498, "learning_rate": 1.545359301395877e-08, "epoch": 0.9875455859079336, "percentage": 98.76, "elapsed_time": "10:01:32", "remaining_time": "0:07:32"}
3589
+ {"current_steps": 3589, "total_steps": 3633, "loss": 0.7754, "learning_rate": 1.4774481697326093e-08, "epoch": 0.9878208215784766, "percentage": 98.79, "elapsed_time": "10:01:42", "remaining_time": "0:07:22"}
3590
+ {"current_steps": 3590, "total_steps": 3633, "loss": 0.7665, "learning_rate": 1.411062387713269e-08, "epoch": 0.9880960572490195, "percentage": 98.82, "elapsed_time": "10:01:52", "remaining_time": "0:07:12"}
3591
+ {"current_steps": 3591, "total_steps": 3633, "loss": 0.7732, "learning_rate": 1.3462020060057701e-08, "epoch": 0.9883712929195624, "percentage": 98.84, "elapsed_time": "10:02:02", "remaining_time": "0:07:02"}
3592
+ {"current_steps": 3592, "total_steps": 3633, "loss": 0.7695, "learning_rate": 1.2828670741140693e-08, "epoch": 0.9886465285901053, "percentage": 98.87, "elapsed_time": "10:02:12", "remaining_time": "0:06:52"}
3593
+ {"current_steps": 3593, "total_steps": 3633, "loss": 0.7936, "learning_rate": 1.2210576403779428e-08, "epoch": 0.9889217642606482, "percentage": 98.9, "elapsed_time": "10:02:22", "remaining_time": "0:06:42"}
3594
+ {"current_steps": 3594, "total_steps": 3633, "loss": 0.7464, "learning_rate": 1.1607737519727658e-08, "epoch": 0.989196999931191, "percentage": 98.93, "elapsed_time": "10:02:32", "remaining_time": "0:06:32"}
3595
+ {"current_steps": 3595, "total_steps": 3633, "loss": 0.7372, "learning_rate": 1.1020154549095108e-08, "epoch": 0.989472235601734, "percentage": 98.95, "elapsed_time": "10:02:42", "remaining_time": "0:06:22"}
3596
+ {"current_steps": 3596, "total_steps": 3633, "loss": 0.7577, "learning_rate": 1.0447827940345268e-08, "epoch": 0.9897474712722769, "percentage": 98.98, "elapsed_time": "10:02:52", "remaining_time": "0:06:12"}
3597
+ {"current_steps": 3597, "total_steps": 3633, "loss": 0.7566, "learning_rate": 9.890758130304268e-09, "epoch": 0.9900227069428198, "percentage": 99.01, "elapsed_time": "10:03:02", "remaining_time": "0:06:02"}
3598
+ {"current_steps": 3598, "total_steps": 3633, "loss": 0.7877, "learning_rate": 9.348945544147558e-09, "epoch": 0.9902979426133627, "percentage": 99.04, "elapsed_time": "10:03:12", "remaining_time": "0:05:52"}
3599
+ {"current_steps": 3599, "total_steps": 3633, "loss": 0.7832, "learning_rate": 8.822390595404352e-09, "epoch": 0.9905731782839056, "percentage": 99.06, "elapsed_time": "10:03:22", "remaining_time": "0:05:42"}
3600
+ {"current_steps": 3600, "total_steps": 3633, "loss": 0.7779, "learning_rate": 8.311093685966498e-09, "epoch": 0.9908484139544484, "percentage": 99.09, "elapsed_time": "10:03:32", "remaining_time": "0:05:31"}
3601
+ {"current_steps": 3601, "total_steps": 3633, "loss": 0.7878, "learning_rate": 7.815055206072952e-09, "epoch": 0.9911236496249914, "percentage": 99.12, "elapsed_time": "10:03:42", "remaining_time": "0:05:21"}
3602
+ {"current_steps": 3602, "total_steps": 3633, "loss": 0.7653, "learning_rate": 7.3342755343208674e-09, "epoch": 0.9913988852955343, "percentage": 99.15, "elapsed_time": "10:03:52", "remaining_time": "0:05:11"}
3603
+ {"current_steps": 3603, "total_steps": 3633, "loss": 0.7767, "learning_rate": 6.868755037658937e-09, "epoch": 0.9916741209660772, "percentage": 99.17, "elapsed_time": "10:04:02", "remaining_time": "0:05:01"}
3604
+ {"current_steps": 3604, "total_steps": 3633, "loss": 0.7746, "learning_rate": 6.418494071389614e-09, "epoch": 0.9919493566366201, "percentage": 99.2, "elapsed_time": "10:04:12", "remaining_time": "0:04:51"}
3605
+ {"current_steps": 3605, "total_steps": 3633, "loss": 0.7788, "learning_rate": 5.983492979171335e-09, "epoch": 0.992224592307163, "percentage": 99.23, "elapsed_time": "10:04:22", "remaining_time": "0:04:41"}
3606
+ {"current_steps": 3606, "total_steps": 3633, "loss": 0.7624, "learning_rate": 5.563752093011854e-09, "epoch": 0.9924998279777059, "percentage": 99.26, "elapsed_time": "10:04:32", "remaining_time": "0:04:31"}
3607
+ {"current_steps": 3607, "total_steps": 3633, "loss": 0.786, "learning_rate": 5.159271733274907e-09, "epoch": 0.9927750636482489, "percentage": 99.28, "elapsed_time": "10:04:42", "remaining_time": "0:04:21"}
3608
+ {"current_steps": 3608, "total_steps": 3633, "loss": 0.7738, "learning_rate": 4.770052208673548e-09, "epoch": 0.9930502993187917, "percentage": 99.31, "elapsed_time": "10:04:52", "remaining_time": "0:04:11"}
3609
+ {"current_steps": 3609, "total_steps": 3633, "loss": 0.7707, "learning_rate": 4.396093816279035e-09, "epoch": 0.9933255349893346, "percentage": 99.34, "elapsed_time": "10:05:03", "remaining_time": "0:04:01"}
3610
+ {"current_steps": 3610, "total_steps": 3633, "loss": 0.7575, "learning_rate": 4.037396841507501e-09, "epoch": 0.9936007706598775, "percentage": 99.37, "elapsed_time": "10:05:13", "remaining_time": "0:03:51"}
3611
+ {"current_steps": 3611, "total_steps": 3633, "loss": 0.7731, "learning_rate": 3.693961558131065e-09, "epoch": 0.9938760063304204, "percentage": 99.39, "elapsed_time": "10:05:23", "remaining_time": "0:03:41"}
3612
+ {"current_steps": 3612, "total_steps": 3633, "loss": 0.7573, "learning_rate": 3.3657882282733812e-09, "epoch": 0.9941512420009633, "percentage": 99.42, "elapsed_time": "10:05:33", "remaining_time": "0:03:31"}
3613
+ {"current_steps": 3613, "total_steps": 3633, "loss": 0.7718, "learning_rate": 3.052877102409646e-09, "epoch": 0.9944264776715063, "percentage": 99.45, "elapsed_time": "10:05:43", "remaining_time": "0:03:21"}
3614
+ {"current_steps": 3614, "total_steps": 3633, "loss": 0.8098, "learning_rate": 2.755228419364375e-09, "epoch": 0.9947017133420492, "percentage": 99.48, "elapsed_time": "10:05:53", "remaining_time": "0:03:11"}
3615
+ {"current_steps": 3615, "total_steps": 3633, "loss": 0.7667, "learning_rate": 2.472842406315845e-09, "epoch": 0.994976949012592, "percentage": 99.5, "elapsed_time": "10:06:03", "remaining_time": "0:03:01"}
3616
+ {"current_steps": 3616, "total_steps": 3633, "loss": 0.747, "learning_rate": 2.205719278789431e-09, "epoch": 0.9952521846831349, "percentage": 99.53, "elapsed_time": "10:06:13", "remaining_time": "0:02:51"}
3617
+ {"current_steps": 3617, "total_steps": 3633, "loss": 0.7664, "learning_rate": 1.9538592406664892e-09, "epoch": 0.9955274203536778, "percentage": 99.56, "elapsed_time": "10:06:23", "remaining_time": "0:02:40"}
3618
+ {"current_steps": 3618, "total_steps": 3633, "loss": 0.7929, "learning_rate": 1.7172624841754748e-09, "epoch": 0.9958026560242207, "percentage": 99.59, "elapsed_time": "10:06:33", "remaining_time": "0:02:30"}
3619
+ {"current_steps": 3619, "total_steps": 3633, "loss": 0.745, "learning_rate": 1.4959291898963836e-09, "epoch": 0.9960778916947637, "percentage": 99.61, "elapsed_time": "10:06:43", "remaining_time": "0:02:20"}
3620
+ {"current_steps": 3620, "total_steps": 3633, "loss": 0.7756, "learning_rate": 1.2898595267585301e-09, "epoch": 0.9963531273653066, "percentage": 99.64, "elapsed_time": "10:06:53", "remaining_time": "0:02:10"}
3621
+ {"current_steps": 3621, "total_steps": 3633, "loss": 0.7875, "learning_rate": 1.0990536520427696e-09, "epoch": 0.9966283630358495, "percentage": 99.67, "elapsed_time": "10:07:03", "remaining_time": "0:02:00"}
3622
+ {"current_steps": 3622, "total_steps": 3633, "loss": 0.7447, "learning_rate": 9.235117113792768e-10, "epoch": 0.9969035987063923, "percentage": 99.7, "elapsed_time": "10:07:13", "remaining_time": "0:01:50"}
3623
+ {"current_steps": 3623, "total_steps": 3633, "loss": 0.7855, "learning_rate": 7.632338387497662e-10, "epoch": 0.9971788343769352, "percentage": 99.72, "elapsed_time": "10:07:23", "remaining_time": "0:01:40"}
3624
+ {"current_steps": 3624, "total_steps": 3633, "loss": 0.7556, "learning_rate": 6.182201564830514e-10, "epoch": 0.9974540700474781, "percentage": 99.75, "elapsed_time": "10:07:33", "remaining_time": "0:01:30"}
3625
+ {"current_steps": 3625, "total_steps": 3633, "loss": 0.7673, "learning_rate": 4.884707752594864e-10, "epoch": 0.9977293057180211, "percentage": 99.78, "elapsed_time": "10:07:43", "remaining_time": "0:01:20"}
3626
+ {"current_steps": 3626, "total_steps": 3633, "loss": 0.7606, "learning_rate": 3.739857941087444e-10, "epoch": 0.998004541388564, "percentage": 99.81, "elapsed_time": "10:07:53", "remaining_time": "0:01:10"}
3627
+ {"current_steps": 3627, "total_steps": 3633, "loss": 0.7782, "learning_rate": 2.747653004098183e-10, "epoch": 0.9982797770591069, "percentage": 99.83, "elapsed_time": "10:08:03", "remaining_time": "0:01:00"}
3628
+ {"current_steps": 3628, "total_steps": 3633, "loss": 0.7419, "learning_rate": 1.9080936989324117e-10, "epoch": 0.9985550127296497, "percentage": 99.86, "elapsed_time": "10:08:13", "remaining_time": "0:00:50"}
3629
+ {"current_steps": 3629, "total_steps": 3633, "loss": 0.7561, "learning_rate": 1.221180666344246e-10, "epoch": 0.9988302484001926, "percentage": 99.89, "elapsed_time": "10:08:23", "remaining_time": "0:00:40"}
3630
+ {"current_steps": 3630, "total_steps": 3633, "loss": 0.7399, "learning_rate": 6.869144306476117e-11, "epoch": 0.9991054840707355, "percentage": 99.92, "elapsed_time": "10:08:33", "remaining_time": "0:00:30"}
3631
+ {"current_steps": 3631, "total_steps": 3633, "loss": 0.7566, "learning_rate": 3.0529539960522104e-11, "epoch": 0.9993807197412785, "percentage": 99.94, "elapsed_time": "10:08:44", "remaining_time": "0:00:20"}
3632
+ {"current_steps": 3632, "total_steps": 3633, "loss": 0.7667, "learning_rate": 7.632386447298245e-12, "epoch": 0.9996559554118214, "percentage": 99.97, "elapsed_time": "10:08:54", "remaining_time": "0:00:10"}
3633
+ {"current_steps": 3633, "total_steps": 3633, "loss": 0.7571, "learning_rate": 0.0, "epoch": 0.9999311910823643, "percentage": 100.0, "elapsed_time": "10:09:04", "remaining_time": "0:00:00"}
3634
+ {"current_steps": 3633, "total_steps": 3633, "epoch": 0.9999311910823643, "percentage": 100.0, "elapsed_time": "10:09:10", "remaining_time": "0:00:00"}