WordProblem / trainer_log.jsonl
pepoo20's picture
End of training
6f51c81 verified
{"current_steps": 300, "total_steps": 9120, "loss": 0.7143, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3e-05, "epoch": 0.03289383514706285, "percentage": 3.29, "elapsed_time": "0:11:46", "remaining_time": "5:46:15"}
{"current_steps": 600, "total_steps": 9120, "loss": 0.2219, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.998339850669331e-05, "epoch": 0.0657876702941257, "percentage": 6.58, "elapsed_time": "0:21:56", "remaining_time": "5:11:39"}
{"current_steps": 900, "total_steps": 9120, "loss": 0.2074, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.9734816848192624e-05, "epoch": 0.09868150544118856, "percentage": 9.87, "elapsed_time": "0:33:43", "remaining_time": "5:08:02"}
{"current_steps": 1200, "total_steps": 9120, "loss": 0.1906, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.9190839785031474e-05, "epoch": 0.1315753405882514, "percentage": 13.16, "elapsed_time": "0:43:50", "remaining_time": "4:49:22"}
{"current_steps": 1500, "total_steps": 9120, "loss": 0.1923, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.835796376008569e-05, "epoch": 0.16446917573531428, "percentage": 16.45, "elapsed_time": "0:55:43", "remaining_time": "4:43:07"}
{"current_steps": 1500, "total_steps": 9120, "loss": null, "eval_loss": 0.1849033087491989, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.16446917573531428, "percentage": 16.45, "elapsed_time": "0:55:43", "remaining_time": "4:43:07"}
{"current_steps": 1800, "total_steps": 9120, "loss": 0.1839, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.7246135390382216e-05, "epoch": 0.19736301088237712, "percentage": 19.74, "elapsed_time": "1:07:10", "remaining_time": "4:33:08"}
{"current_steps": 2100, "total_steps": 9120, "loss": 0.1938, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.586863267968384e-05, "epoch": 0.23025684602944, "percentage": 23.03, "elapsed_time": "1:19:01", "remaining_time": "4:24:08"}
{"current_steps": 2400, "total_steps": 9120, "loss": 0.1863, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.4241906446007296e-05, "epoch": 0.2631506811765028, "percentage": 26.32, "elapsed_time": "1:29:09", "remaining_time": "4:09:38"}
{"current_steps": 2700, "total_steps": 9120, "loss": 0.1797, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.238538385782601e-05, "epoch": 0.2960445163235657, "percentage": 29.61, "elapsed_time": "1:40:55", "remaining_time": "3:59:59"}
{"current_steps": 3000, "total_steps": 9120, "loss": 0.176, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.032123642522486e-05, "epoch": 0.32893835147062855, "percentage": 32.89, "elapsed_time": "1:51:07", "remaining_time": "3:46:41"}
{"current_steps": 3000, "total_steps": 9120, "loss": null, "eval_loss": 0.1760552078485489, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.32893835147062855, "percentage": 32.89, "elapsed_time": "1:51:07", "remaining_time": "3:46:41"}
{"current_steps": 3300, "total_steps": 9120, "loss": 0.1791, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.8074115216771435e-05, "epoch": 0.3618321866176914, "percentage": 36.18, "elapsed_time": "2:04:22", "remaining_time": "3:39:21"}
{"current_steps": 3600, "total_steps": 9120, "loss": 0.1808, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.567085646427478e-05, "epoch": 0.39472602176475424, "percentage": 39.47, "elapsed_time": "2:14:33", "remaining_time": "3:26:19"}
{"current_steps": 3900, "total_steps": 9120, "loss": 0.1805, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.3140161071244915e-05, "epoch": 0.4276198569118171, "percentage": 42.76, "elapsed_time": "2:26:25", "remaining_time": "3:15:58"}
{"current_steps": 4200, "total_steps": 9120, "loss": 0.1738, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 3.05122518525215e-05, "epoch": 0.46051369205888, "percentage": 46.05, "elapsed_time": "2:36:32", "remaining_time": "3:03:22"}
{"current_steps": 4500, "total_steps": 9120, "loss": 0.1736, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.781851259848554e-05, "epoch": 0.49340752720594283, "percentage": 49.34, "elapsed_time": "2:48:26", "remaining_time": "2:52:55"}
{"current_steps": 4500, "total_steps": 9120, "loss": null, "eval_loss": 0.17090687155723572, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.49340752720594283, "percentage": 49.34, "elapsed_time": "2:48:26", "remaining_time": "2:52:55"}
{"current_steps": 4800, "total_steps": 9120, "loss": 0.1709, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.509111327432736e-05, "epoch": 0.5263013623530056, "percentage": 52.63, "elapsed_time": "2:59:53", "remaining_time": "2:41:53"}
{"current_steps": 5100, "total_steps": 9120, "loss": 0.1775, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.236262583042668e-05, "epoch": 0.5591951975000685, "percentage": 55.92, "elapsed_time": "3:11:41", "remaining_time": "2:31:05"}
{"current_steps": 5400, "total_steps": 9120, "loss": 0.1759, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.966563521202681e-05, "epoch": 0.5920890326471314, "percentage": 59.21, "elapsed_time": "3:21:50", "remaining_time": "2:19:02"}
{"current_steps": 5700, "total_steps": 9120, "loss": 0.1754, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.7032350213717874e-05, "epoch": 0.6249828677941942, "percentage": 62.5, "elapsed_time": "3:33:38", "remaining_time": "2:08:11"}
{"current_steps": 6000, "total_steps": 9120, "loss": 0.1688, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.4494218826096939e-05, "epoch": 0.6578767029412571, "percentage": 65.79, "elapsed_time": "3:43:45", "remaining_time": "1:56:21"}
{"current_steps": 6000, "total_steps": 9120, "loss": null, "eval_loss": 0.16823573410511017, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.6578767029412571, "percentage": 65.79, "elapsed_time": "3:43:45", "remaining_time": "1:56:21"}
{"current_steps": 6300, "total_steps": 9120, "loss": 0.1707, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.2081552668325321e-05, "epoch": 0.6907705380883199, "percentage": 69.08, "elapsed_time": "3:57:06", "remaining_time": "1:46:08"}
{"current_steps": 6600, "total_steps": 9120, "loss": 0.171, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 9.82316499179518e-06, "epoch": 0.7236643732353828, "percentage": 72.37, "elapsed_time": "4:07:12", "remaining_time": "1:34:23"}
{"current_steps": 6900, "total_steps": 9120, "loss": 0.1702, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 7.74602657804425e-06, "epoch": 0.7565582083824457, "percentage": 75.66, "elapsed_time": "4:19:03", "remaining_time": "1:23:21"}
{"current_steps": 7200, "total_steps": 9120, "loss": 0.1718, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 5.874943640356082e-06, "epoch": 0.7894520435295085, "percentage": 78.95, "elapsed_time": "4:29:14", "remaining_time": "1:11:47"}
{"current_steps": 7500, "total_steps": 9120, "loss": 0.1689, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 4.232261575703861e-06, "epoch": 0.8223458786765714, "percentage": 82.24, "elapsed_time": "4:41:05", "remaining_time": "1:00:42"}
{"current_steps": 7500, "total_steps": 9120, "loss": null, "eval_loss": 0.16773280501365662, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.8223458786765714, "percentage": 82.24, "elapsed_time": "4:41:05", "remaining_time": "1:00:42"}
{"current_steps": 7800, "total_steps": 9120, "loss": 0.1692, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.83759810497852e-06, "epoch": 0.8552397138236342, "percentage": 85.53, "elapsed_time": "4:52:30", "remaining_time": "0:49:30"}
{"current_steps": 8100, "total_steps": 9120, "loss": 0.1787, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 1.70760898847247e-06, "epoch": 0.8881335489706971, "percentage": 88.82, "elapsed_time": "5:04:20", "remaining_time": "0:38:19"}
{"current_steps": 8400, "total_steps": 9120, "loss": 0.1733, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 8.557891145603042e-07, "epoch": 0.92102738411776, "percentage": 92.11, "elapsed_time": "5:14:28", "remaining_time": "0:26:57"}
{"current_steps": 8700, "total_steps": 9120, "loss": 0.1741, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.923113370737779e-07, "epoch": 0.9539212192648228, "percentage": 95.39, "elapsed_time": "5:26:22", "remaining_time": "0:15:45"}
{"current_steps": 9000, "total_steps": 9120, "loss": 0.168, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": 2.3904986054812396e-08, "epoch": 0.9868150544118857, "percentage": 98.68, "elapsed_time": "5:36:30", "remaining_time": "0:04:29"}
{"current_steps": 9000, "total_steps": 9120, "loss": null, "eval_loss": 0.1676628440618515, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9868150544118857, "percentage": 98.68, "elapsed_time": "5:36:30", "remaining_time": "0:04:29"}
{"current_steps": 9120, "total_steps": 9120, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9999725884707108, "percentage": 100.0, "elapsed_time": "5:43:04", "remaining_time": "0:00:00"}
{"current_steps": 745, "total_steps": 745, "loss": null, "eval_loss": 0.1676628440618515, "predict_loss": null, "reward": null, "accuracy": null, "learning_rate": null, "epoch": 0.9999725884707108, "percentage": 100.0, "elapsed_time": "5:44:46", "remaining_time": "0:00:00"}