{ "best_metric": 0.9180412395863843, "best_model_checkpoint": "/home/hoan/projects/nsfw/models/efficientvit_l1.r224_in1k/run-cpz6d1iz/checkpoint-616", "epoch": 29.647058823529413, "eval_steps": 500, "global_step": 630, "is_hyper_param_search": true, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.61, "learning_rate": 9.337297572513965e-06, "loss": 1.4974, "step": 13 }, { "epoch": 0.99, "eval_accuracy": 0.8245565410199557, "eval_f1": 0.7504652622410692, "eval_loss": 1.1778662204742432, "eval_precision": 0.7010977125485033, "eval_recall": 0.8245565410199557, "eval_runtime": 7.9368, "eval_samples_per_second": 454.594, "eval_steps_per_second": 3.654, "step": 21 }, { "epoch": 1.22, "learning_rate": 1.867459514502793e-05, "loss": 1.2529, "step": 26 }, { "epoch": 1.84, "learning_rate": 2.8011892717541894e-05, "loss": 0.9843, "step": 39 }, { "epoch": 1.98, "eval_accuracy": 0.8323170731707317, "eval_f1": 0.7607906844449553, "eval_loss": 0.9312257170677185, "eval_precision": 0.7813901035438382, "eval_recall": 0.8323170731707317, "eval_runtime": 7.8479, "eval_samples_per_second": 459.738, "eval_steps_per_second": 3.695, "step": 42 }, { "epoch": 2.45, "learning_rate": 3.734919029005586e-05, "loss": 0.9036, "step": 52 }, { "epoch": 2.96, "eval_accuracy": 0.8852549889135255, "eval_f1": 0.8727382252421404, "eval_loss": 0.8863803744316101, "eval_precision": 0.8818471384989105, "eval_recall": 0.8852549889135255, "eval_runtime": 8.2029, "eval_samples_per_second": 439.844, "eval_steps_per_second": 3.535, "step": 63 }, { "epoch": 3.06, "learning_rate": 4.668648786256983e-05, "loss": 0.8702, "step": 65 }, { "epoch": 3.67, "learning_rate": 5.602378543508379e-05, "loss": 0.8272, "step": 78 }, { "epoch": 4.0, "eval_accuracy": 0.9088137472283814, "eval_f1": 0.9016044442281315, "eval_loss": 0.827029824256897, "eval_precision": 0.8977767175054678, "eval_recall": 0.9088137472283814, "eval_runtime": 8.6469, "eval_samples_per_second": 417.259, "eval_steps_per_second": 3.354, "step": 85 }, { "epoch": 4.28, "learning_rate": 6.536108300759776e-05, "loss": 0.8124, "step": 91 }, { "epoch": 4.89, "learning_rate": 7.469838058011172e-05, "loss": 0.791, "step": 104 }, { "epoch": 4.99, "eval_accuracy": 0.8896895787139689, "eval_f1": 0.8908302243934083, "eval_loss": 0.8426142930984497, "eval_precision": 0.8952544356380175, "eval_recall": 0.8896895787139689, "eval_runtime": 7.9673, "eval_samples_per_second": 452.854, "eval_steps_per_second": 3.64, "step": 106 }, { "epoch": 5.51, "learning_rate": 8.403567815262568e-05, "loss": 0.7742, "step": 117 }, { "epoch": 5.98, "eval_accuracy": 0.9077050997782705, "eval_f1": 0.8952158275122053, "eval_loss": 0.8156972527503967, "eval_precision": 0.900683213811247, "eval_recall": 0.9077050997782705, "eval_runtime": 8.0605, "eval_samples_per_second": 447.614, "eval_steps_per_second": 3.598, "step": 127 }, { "epoch": 6.12, "learning_rate": 9.048589657902734e-05, "loss": 0.7771, "step": 130 }, { "epoch": 6.73, "learning_rate": 9.02461453820045e-05, "loss": 0.7696, "step": 143 }, { "epoch": 6.96, "eval_accuracy": 0.9149113082039911, "eval_f1": 0.9089808097871447, "eval_loss": 0.8019198775291443, "eval_precision": 0.9083537029648736, "eval_recall": 0.9149113082039911, "eval_runtime": 8.2664, "eval_samples_per_second": 436.464, "eval_steps_per_second": 3.508, "step": 148 }, { "epoch": 7.34, "learning_rate": 8.971109434044089e-05, "loss": 0.7627, "step": 156 }, { "epoch": 7.95, "learning_rate": 8.888425487558681e-05, "loss": 0.7579, "step": 169 }, { "epoch": 8.0, "eval_accuracy": 0.9099223946784922, "eval_f1": 0.9056360787135247, "eval_loss": 0.8119347095489502, "eval_precision": 0.9037596807714011, "eval_recall": 0.9099223946784922, "eval_runtime": 8.3286, "eval_samples_per_second": 433.208, "eval_steps_per_second": 3.482, "step": 170 }, { "epoch": 8.56, "learning_rate": 8.777105335136256e-05, "loss": 0.753, "step": 182 }, { "epoch": 8.99, "eval_accuracy": 0.9143569844789357, "eval_f1": 0.905016737540752, "eval_loss": 0.8058480024337769, "eval_precision": 0.9043267295510783, "eval_recall": 0.9143569844789357, "eval_runtime": 7.8299, "eval_samples_per_second": 460.796, "eval_steps_per_second": 3.704, "step": 191 }, { "epoch": 9.18, "learning_rate": 8.637879546233632e-05, "loss": 0.7467, "step": 195 }, { "epoch": 9.79, "learning_rate": 8.471661828807179e-05, "loss": 0.7414, "step": 208 }, { "epoch": 9.98, "eval_accuracy": 0.8910753880266076, "eval_f1": 0.8925899353200606, "eval_loss": 0.8334646821022034, "eval_precision": 0.8965909503064864, "eval_recall": 0.8910753880266076, "eval_runtime": 8.1268, "eval_samples_per_second": 443.961, "eval_steps_per_second": 3.568, "step": 212 }, { "epoch": 10.4, "learning_rate": 8.279543032850277e-05, "loss": 0.736, "step": 221 }, { "epoch": 10.96, "eval_accuracy": 0.899390243902439, "eval_f1": 0.9002456226563228, "eval_loss": 0.8323202133178711, "eval_precision": 0.903732584843102, "eval_recall": 0.899390243902439, "eval_runtime": 7.848, "eval_samples_per_second": 459.738, "eval_steps_per_second": 3.695, "step": 233 }, { "epoch": 11.01, "learning_rate": 8.062783991386883e-05, "loss": 0.7351, "step": 234 }, { "epoch": 11.62, "learning_rate": 7.822807245904186e-05, "loss": 0.7312, "step": 247 }, { "epoch": 12.0, "eval_accuracy": 0.9154656319290465, "eval_f1": 0.9086965051403931, "eval_loss": 0.802578330039978, "eval_precision": 0.9043713569516466, "eval_recall": 0.9154656319290465, "eval_runtime": 7.9576, "eval_samples_per_second": 453.405, "eval_steps_per_second": 3.644, "step": 255 }, { "epoch": 12.24, "learning_rate": 7.561187710528515e-05, "loss": 0.7311, "step": 260 }, { "epoch": 12.85, "learning_rate": 7.279642336213425e-05, "loss": 0.722, "step": 273 }, { "epoch": 12.99, "eval_accuracy": 0.9054878048780488, "eval_f1": 0.9053749893268752, "eval_loss": 0.8218502402305603, "eval_precision": 0.9072092893262743, "eval_recall": 0.9054878048780488, "eval_runtime": 8.5776, "eval_samples_per_second": 420.629, "eval_steps_per_second": 3.381, "step": 276 }, { "epoch": 13.46, "learning_rate": 6.980018842771594e-05, "loss": 0.728, "step": 286 }, { "epoch": 13.98, "eval_accuracy": 0.9146341463414634, "eval_f1": 0.9088337129199915, "eval_loss": 0.803844690322876, "eval_precision": 0.9053003849300292, "eval_recall": 0.9146341463414634, "eval_runtime": 8.4963, "eval_samples_per_second": 424.653, "eval_steps_per_second": 3.413, "step": 297 }, { "epoch": 14.07, "learning_rate": 6.664283592699743e-05, "loss": 0.7174, "step": 299 }, { "epoch": 14.68, "learning_rate": 6.33450868637792e-05, "loss": 0.7178, "step": 312 }, { "epoch": 14.96, "eval_accuracy": 0.917960088691796, "eval_f1": 0.9115339219530667, "eval_loss": 0.8020056486129761, "eval_precision": 0.9126518511003248, "eval_recall": 0.917960088691796, "eval_runtime": 8.0058, "eval_samples_per_second": 450.671, "eval_steps_per_second": 3.622, "step": 318 }, { "epoch": 15.29, "learning_rate": 5.99285836333455e-05, "loss": 0.7168, "step": 325 }, { "epoch": 15.91, "learning_rate": 5.6415747988226656e-05, "loss": 0.7181, "step": 338 }, { "epoch": 16.0, "eval_accuracy": 0.9168514412416852, "eval_f1": 0.9074858536331818, "eval_loss": 0.8075320720672607, "eval_precision": 0.9090067831913919, "eval_recall": 0.9168514412416852, "eval_runtime": 8.2679, "eval_samples_per_second": 436.387, "eval_steps_per_second": 3.508, "step": 340 }, { "epoch": 16.52, "learning_rate": 5.282963388921312e-05, "loss": 0.7132, "step": 351 }, { "epoch": 16.99, "eval_accuracy": 0.9115853658536586, "eval_f1": 0.9105576927569372, "eval_loss": 0.8095524311065674, "eval_precision": 0.9105897373648217, "eval_recall": 0.9115853658536586, "eval_runtime": 8.3192, "eval_samples_per_second": 433.694, "eval_steps_per_second": 3.486, "step": 361 }, { "epoch": 17.13, "learning_rate": 4.919377620732666e-05, "loss": 0.7122, "step": 364 }, { "epoch": 17.74, "learning_rate": 4.553203626968464e-05, "loss": 0.7102, "step": 377 }, { "epoch": 17.98, "eval_accuracy": 0.9126940133037694, "eval_f1": 0.9109325265921849, "eval_loss": 0.8063324093818665, "eval_precision": 0.909426612792062, "eval_recall": 0.9126940133037694, "eval_runtime": 8.1988, "eval_samples_per_second": 440.063, "eval_steps_per_second": 3.537, "step": 382 }, { "epoch": 18.35, "learning_rate": 4.1868445262905336e-05, "loss": 0.7107, "step": 390 }, { "epoch": 18.96, "learning_rate": 3.8227046521762955e-05, "loss": 0.7057, "step": 403 }, { "epoch": 18.96, "eval_accuracy": 0.9124168514412417, "eval_f1": 0.9116152740130952, "eval_loss": 0.8127285838127136, "eval_precision": 0.9140500451639162, "eval_recall": 0.9124168514412417, "eval_runtime": 8.2949, "eval_samples_per_second": 434.968, "eval_steps_per_second": 3.496, "step": 403 }, { "epoch": 19.58, "learning_rate": 3.463173773811715e-05, "loss": 0.7102, "step": 416 }, { "epoch": 20.0, "eval_accuracy": 0.9193458980044346, "eval_f1": 0.9124581241091632, "eval_loss": 0.8046479225158691, "eval_precision": 0.9094511683912293, "eval_recall": 0.9193458980044346, "eval_runtime": 8.4514, "eval_samples_per_second": 426.911, "eval_steps_per_second": 3.431, "step": 425 }, { "epoch": 20.19, "learning_rate": 3.1106114125664475e-05, "loss": 0.7031, "step": 429 }, { "epoch": 20.8, "learning_rate": 2.7673313569787155e-05, "loss": 0.6998, "step": 442 }, { "epoch": 20.99, "eval_accuracy": 0.916019955654102, "eval_f1": 0.9107592161617032, "eval_loss": 0.8098756074905396, "eval_precision": 0.9094635680966053, "eval_recall": 0.916019955654102, "eval_runtime": 8.2362, "eval_samples_per_second": 438.069, "eval_steps_per_second": 3.521, "step": 446 }, { "epoch": 21.41, "learning_rate": 2.4355864778745852e-05, "loss": 0.7051, "step": 455 }, { "epoch": 21.98, "eval_accuracy": 0.9174057649667405, "eval_f1": 0.9142268993626627, "eval_loss": 0.8050925731658936, "eval_precision": 0.9130379000974386, "eval_recall": 0.9174057649667405, "eval_runtime": 8.3981, "eval_samples_per_second": 429.62, "eval_steps_per_second": 3.453, "step": 467 }, { "epoch": 22.02, "learning_rate": 2.1175539432766786e-05, "loss": 0.7013, "step": 468 }, { "epoch": 22.64, "learning_rate": 1.8153209301335927e-05, "loss": 0.6986, "step": 481 }, { "epoch": 22.96, "eval_accuracy": 0.9143569844789357, "eval_f1": 0.9094601509445771, "eval_loss": 0.8089693188667297, "eval_precision": 0.9069934469200637, "eval_recall": 0.9143569844789357, "eval_runtime": 8.7255, "eval_samples_per_second": 413.501, "eval_steps_per_second": 3.324, "step": 488 }, { "epoch": 23.25, "learning_rate": 1.5308709266407565e-05, "loss": 0.6993, "step": 494 }, { "epoch": 23.86, "learning_rate": 1.2660707150475642e-05, "loss": 0.7004, "step": 507 }, { "epoch": 24.0, "eval_accuracy": 0.9190687361419069, "eval_f1": 0.9157749931932022, "eval_loss": 0.7969859838485718, "eval_precision": 0.9146257718265792, "eval_recall": 0.9190687361419069, "eval_runtime": 7.8691, "eval_samples_per_second": 458.501, "eval_steps_per_second": 3.685, "step": 510 }, { "epoch": 24.47, "learning_rate": 1.0226581203797468e-05, "loss": 0.6992, "step": 520 }, { "epoch": 24.99, "eval_accuracy": 0.9187915742793792, "eval_f1": 0.9128722156884925, "eval_loss": 0.8054778575897217, "eval_precision": 0.9123823991036795, "eval_recall": 0.9187915742793792, "eval_runtime": 8.3104, "eval_samples_per_second": 434.157, "eval_steps_per_second": 3.49, "step": 531 }, { "epoch": 25.08, "learning_rate": 8.022306054793715e-06, "loss": 0.6988, "step": 533 }, { "epoch": 25.69, "learning_rate": 6.062347872107096e-06, "loss": 0.6956, "step": 546 }, { "epoch": 25.98, "eval_accuracy": 0.9201773835920177, "eval_f1": 0.9159544845078982, "eval_loss": 0.7970059514045715, "eval_precision": 0.9139707421362406, "eval_recall": 0.9201773835920177, "eval_runtime": 8.3576, "eval_samples_per_second": 431.703, "eval_steps_per_second": 3.47, "step": 552 }, { "epoch": 26.31, "learning_rate": 4.359569426347826e-06, "loss": 0.6955, "step": 559 }, { "epoch": 26.92, "learning_rate": 2.925145674584495e-06, "loss": 0.6941, "step": 572 }, { "epoch": 26.96, "eval_accuracy": 0.9193458980044346, "eval_f1": 0.9158537735891641, "eval_loss": 0.8026701807975769, "eval_precision": 0.9141634537835975, "eval_recall": 0.9193458980044346, "eval_runtime": 8.2835, "eval_samples_per_second": 435.562, "eval_steps_per_second": 3.501, "step": 573 }, { "epoch": 27.53, "learning_rate": 1.7684904215807802e-06, "loss": 0.6973, "step": 585 }, { "epoch": 28.0, "eval_accuracy": 0.9149113082039911, "eval_f1": 0.9105265775058081, "eval_loss": 0.8031827807426453, "eval_precision": 0.9092055837026697, "eval_recall": 0.9149113082039911, "eval_runtime": 8.0208, "eval_samples_per_second": 449.829, "eval_steps_per_second": 3.616, "step": 595 }, { "epoch": 28.14, "learning_rate": 8.971945390837938e-07, "loss": 0.698, "step": 598 }, { "epoch": 28.75, "learning_rate": 3.169761486173364e-07, "loss": 0.6969, "step": 611 }, { "epoch": 28.99, "eval_accuracy": 0.9223946784922394, "eval_f1": 0.9180412395863843, "eval_loss": 0.7970722913742065, "eval_precision": 0.9152796171817729, "eval_recall": 0.9223946784922394, "eval_runtime": 8.4656, "eval_samples_per_second": 426.196, "eval_steps_per_second": 3.426, "step": 616 }, { "epoch": 29.36, "learning_rate": 3.1643094719280604e-08, "loss": 0.6981, "step": 624 }, { "epoch": 29.65, "eval_accuracy": 0.9187915742793792, "eval_f1": 0.9142339823689526, "eval_loss": 0.804097056388855, "eval_precision": 0.913375902362099, "eval_recall": 0.9187915742793792, "eval_runtime": 7.8761, "eval_samples_per_second": 458.092, "eval_steps_per_second": 3.682, "step": 630 } ], "logging_steps": 13, "max_steps": 630, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 500, "total_flos": 0.0, "train_batch_size": 128, "trial_name": null, "trial_params": { "_wandb": {}, "assignments": {}, "label_smoothing_factor": 0.029883991666275297, "learning_rate": 9.049996108744304e-05, "metric": "eval/loss", "weight_decay": 0.011787322184488629 } }