stackexchange_cstheory / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
bac65f2 verified
{"current_steps": 10, "total_steps": 69, "loss": 1.2052, "lr": 5e-06, "epoch": 0.42780748663101603, "percentage": 14.49, "elapsed_time": "0:09:45", "remaining_time": "0:57:31"}
{"current_steps": 20, "total_steps": 69, "loss": 1.0858, "lr": 5e-06, "epoch": 0.8556149732620321, "percentage": 28.99, "elapsed_time": "0:19:25", "remaining_time": "0:47:35"}
{"current_steps": 23, "total_steps": 69, "eval_loss": 1.0545072555541992, "epoch": 0.983957219251337, "percentage": 33.33, "elapsed_time": "0:22:59", "remaining_time": "0:45:59"}
{"current_steps": 30, "total_steps": 69, "loss": 1.1308, "lr": 5e-06, "epoch": 1.2887700534759359, "percentage": 43.48, "elapsed_time": "0:30:39", "remaining_time": "0:39:51"}
{"current_steps": 40, "total_steps": 69, "loss": 1.0111, "lr": 5e-06, "epoch": 1.7165775401069518, "percentage": 57.97, "elapsed_time": "0:40:18", "remaining_time": "0:29:13"}
{"current_steps": 46, "total_steps": 69, "eval_loss": 1.0155441761016846, "epoch": 1.9732620320855614, "percentage": 66.67, "elapsed_time": "0:46:59", "remaining_time": "0:23:29"}
{"current_steps": 50, "total_steps": 69, "loss": 1.0605, "lr": 5e-06, "epoch": 2.1497326203208558, "percentage": 72.46, "elapsed_time": "0:51:36", "remaining_time": "0:19:36"}
{"current_steps": 60, "total_steps": 69, "loss": 0.9514, "lr": 5e-06, "epoch": 2.5775401069518717, "percentage": 86.96, "elapsed_time": "1:01:17", "remaining_time": "0:09:11"}
{"current_steps": 69, "total_steps": 69, "eval_loss": 0.9938156008720398, "epoch": 2.962566844919786, "percentage": 100.0, "elapsed_time": "1:11:38", "remaining_time": "0:00:00"}
{"current_steps": 69, "total_steps": 69, "epoch": 2.962566844919786, "percentage": 100.0, "elapsed_time": "1:12:53", "remaining_time": "0:00:00"}