STAIR-Llama-3.1-8B-DPO-3 / trainer_log.jsonl
skyai798's picture
Upload folder using huggingface_hub
3101072 verified
{"current_steps": 10, "total_steps": 357, "loss": 0.8679, "accuracy": 0.32499998807907104, "learning_rate": 1.3888888888888888e-07, "epoch": 0.0280014000700035, "percentage": 2.8, "elapsed_time": "0:03:37", "remaining_time": "2:05:54"}
{"current_steps": 20, "total_steps": 357, "loss": 0.8677, "accuracy": 0.5062500238418579, "learning_rate": 2.7777777777777776e-07, "epoch": 0.056002800140007, "percentage": 5.6, "elapsed_time": "0:07:15", "remaining_time": "2:02:17"}
{"current_steps": 30, "total_steps": 357, "loss": 0.8652, "accuracy": 0.5249999761581421, "learning_rate": 4.1666666666666667e-07, "epoch": 0.0840042002100105, "percentage": 8.4, "elapsed_time": "0:10:49", "remaining_time": "1:57:56"}
{"current_steps": 40, "total_steps": 357, "loss": 0.857, "accuracy": 0.643750011920929, "learning_rate": 4.998084579146532e-07, "epoch": 0.112005600280014, "percentage": 11.2, "elapsed_time": "0:14:25", "remaining_time": "1:54:15"}
{"current_steps": 50, "total_steps": 357, "loss": 0.8571, "accuracy": 0.5687500238418579, "learning_rate": 4.976569787782584e-07, "epoch": 0.1400070003500175, "percentage": 14.01, "elapsed_time": "0:17:56", "remaining_time": "1:50:08"}
{"current_steps": 60, "total_steps": 357, "loss": 0.8467, "accuracy": 0.550000011920929, "learning_rate": 4.931352528237397e-07, "epoch": 0.168008400420021, "percentage": 16.81, "elapsed_time": "0:21:37", "remaining_time": "1:47:03"}
{"current_steps": 70, "total_steps": 357, "loss": 0.8469, "accuracy": 0.5562499761581421, "learning_rate": 4.862865560637862e-07, "epoch": 0.1960098004900245, "percentage": 19.61, "elapsed_time": "0:25:09", "remaining_time": "1:43:07"}
{"current_steps": 80, "total_steps": 357, "loss": 0.8296, "accuracy": 0.581250011920929, "learning_rate": 4.771764352146005e-07, "epoch": 0.224011200560028, "percentage": 22.41, "elapsed_time": "0:28:46", "remaining_time": "1:39:36"}
{"current_steps": 90, "total_steps": 357, "loss": 0.8274, "accuracy": 0.574999988079071, "learning_rate": 4.658920803689553e-07, "epoch": 0.2520126006300315, "percentage": 25.21, "elapsed_time": "0:32:19", "remaining_time": "1:35:53"}
{"current_steps": 100, "total_steps": 357, "loss": 0.823, "accuracy": 0.518750011920929, "learning_rate": 4.5254149052732074e-07, "epoch": 0.280014000700035, "percentage": 28.01, "elapsed_time": "0:36:00", "remaining_time": "1:32:31"}
{"current_steps": 110, "total_steps": 357, "loss": 0.8183, "accuracy": 0.6312500238418579, "learning_rate": 4.372524399734997e-07, "epoch": 0.3080154007700385, "percentage": 30.81, "elapsed_time": "0:39:43", "remaining_time": "1:29:12"}
{"current_steps": 120, "total_steps": 357, "loss": 0.8163, "accuracy": 0.59375, "learning_rate": 4.201712553872657e-07, "epoch": 0.336016800840042, "percentage": 33.61, "elapsed_time": "0:43:24", "remaining_time": "1:25:43"}
{"current_steps": 130, "total_steps": 357, "loss": 0.8041, "accuracy": 0.625, "learning_rate": 4.014614153978704e-07, "epoch": 0.3640182009100455, "percentage": 36.41, "elapsed_time": "0:47:08", "remaining_time": "1:22:19"}
{"current_steps": 140, "total_steps": 357, "loss": 0.8088, "accuracy": 0.625, "learning_rate": 3.8130198598165444e-07, "epoch": 0.392019600980049, "percentage": 39.22, "elapsed_time": "0:50:46", "remaining_time": "1:18:42"}
{"current_steps": 150, "total_steps": 357, "loss": 0.7981, "accuracy": 0.581250011920929, "learning_rate": 3.598859066780754e-07, "epoch": 0.4200210010500525, "percentage": 42.02, "elapsed_time": "0:54:18", "remaining_time": "1:14:56"}
{"current_steps": 160, "total_steps": 357, "loss": 0.7991, "accuracy": 0.612500011920929, "learning_rate": 3.374181440262409e-07, "epoch": 0.448022401120056, "percentage": 44.82, "elapsed_time": "0:57:59", "remaining_time": "1:11:23"}
{"current_steps": 170, "total_steps": 357, "loss": 0.8001, "accuracy": 0.5874999761581421, "learning_rate": 3.14113729894821e-07, "epoch": 0.4760238011900595, "percentage": 47.62, "elapsed_time": "1:01:40", "remaining_time": "1:07:50"}
{"current_steps": 180, "total_steps": 357, "loss": 0.7937, "accuracy": 0.675000011920929, "learning_rate": 2.9019570347986706e-07, "epoch": 0.504025201260063, "percentage": 50.42, "elapsed_time": "1:05:11", "remaining_time": "1:04:06"}
{"current_steps": 190, "total_steps": 357, "loss": 0.7828, "accuracy": 0.71875, "learning_rate": 2.6589297666702654e-07, "epoch": 0.5320266013300665, "percentage": 53.22, "elapsed_time": "1:08:49", "remaining_time": "1:00:29"}
{"current_steps": 200, "total_steps": 357, "loss": 0.7841, "accuracy": 0.59375, "learning_rate": 2.414381431880974e-07, "epoch": 0.56002800140007, "percentage": 56.02, "elapsed_time": "1:12:19", "remaining_time": "0:56:46"}
{"current_steps": 210, "total_steps": 357, "loss": 0.7812, "accuracy": 0.699999988079071, "learning_rate": 2.1706525253979534e-07, "epoch": 0.5880294014700735, "percentage": 58.82, "elapsed_time": "1:15:57", "remaining_time": "0:53:10"}
{"current_steps": 220, "total_steps": 357, "loss": 0.7743, "accuracy": 0.65625, "learning_rate": 1.9300756996985379e-07, "epoch": 0.616030801540077, "percentage": 61.62, "elapsed_time": "1:19:29", "remaining_time": "0:49:30"}
{"current_steps": 230, "total_steps": 357, "loss": 0.7781, "accuracy": 0.675000011920929, "learning_rate": 1.6949534396892355e-07, "epoch": 0.6440322016100805, "percentage": 64.43, "elapsed_time": "1:23:11", "remaining_time": "0:45:56"}
{"current_steps": 240, "total_steps": 357, "loss": 0.7789, "accuracy": 0.625, "learning_rate": 1.4675360263490295e-07, "epoch": 0.672033601680084, "percentage": 67.23, "elapsed_time": "1:26:43", "remaining_time": "0:42:16"}
{"current_steps": 250, "total_steps": 357, "loss": 0.7694, "accuracy": 0.65625, "learning_rate": 1.2500000000000005e-07, "epoch": 0.7000350017500875, "percentage": 70.03, "elapsed_time": "1:30:26", "remaining_time": "0:38:42"}
{"current_steps": 260, "total_steps": 357, "loss": 0.7654, "accuracy": 0.7437499761581421, "learning_rate": 1.0444273293265149e-07, "epoch": 0.728036401820091, "percentage": 72.83, "elapsed_time": "1:34:04", "remaining_time": "0:35:05"}
{"current_steps": 270, "total_steps": 357, "loss": 0.777, "accuracy": 0.65625, "learning_rate": 8.527854855097224e-08, "epoch": 0.7560378018900945, "percentage": 75.63, "elapsed_time": "1:37:45", "remaining_time": "0:31:30"}
{"current_steps": 280, "total_steps": 357, "loss": 0.7707, "accuracy": 0.675000011920929, "learning_rate": 6.769086121815423e-08, "epoch": 0.784039201960098, "percentage": 78.43, "elapsed_time": "1:41:15", "remaining_time": "0:27:50"}
{"current_steps": 290, "total_steps": 357, "loss": 0.7698, "accuracy": 0.6499999761581421, "learning_rate": 5.184799714145557e-08, "epoch": 0.8120406020301015, "percentage": 81.23, "elapsed_time": "1:44:52", "remaining_time": "0:24:13"}
{"current_steps": 300, "total_steps": 357, "loss": 0.7656, "accuracy": 0.6875, "learning_rate": 3.790158337517127e-08, "epoch": 0.840042002100105, "percentage": 84.03, "elapsed_time": "1:48:29", "remaining_time": "0:20:36"}
{"current_steps": 310, "total_steps": 357, "loss": 0.7705, "accuracy": 0.612500011920929, "learning_rate": 2.5985096645928934e-08, "epoch": 0.8680434021701086, "percentage": 86.83, "elapsed_time": "1:52:07", "remaining_time": "0:17:00"}
{"current_steps": 320, "total_steps": 357, "loss": 0.7644, "accuracy": 0.706250011920929, "learning_rate": 1.6212585889044366e-08, "epoch": 0.896044802240112, "percentage": 89.64, "elapsed_time": "1:55:41", "remaining_time": "0:13:22"}
{"current_steps": 330, "total_steps": 357, "loss": 0.7677, "accuracy": 0.65625, "learning_rate": 8.677580722139671e-09, "epoch": 0.9240462023101155, "percentage": 92.44, "elapsed_time": "1:59:12", "remaining_time": "0:09:45"}
{"current_steps": 340, "total_steps": 357, "loss": 0.7629, "accuracy": 0.706250011920929, "learning_rate": 3.452196302677901e-09, "epoch": 0.952047602380119, "percentage": 95.24, "elapsed_time": "2:02:51", "remaining_time": "0:06:08"}
{"current_steps": 350, "total_steps": 357, "loss": 0.7734, "accuracy": 0.706250011920929, "learning_rate": 5.864431365401879e-10, "epoch": 0.9800490024501225, "percentage": 98.04, "elapsed_time": "2:06:28", "remaining_time": "0:02:31"}
{"current_steps": 357, "total_steps": 357, "epoch": 0.999649982499125, "percentage": 100.0, "elapsed_time": "2:09:21", "remaining_time": "0:00:00"}