{ "best_metric": 0.6466411352157593, "best_model_checkpoint": "BERT-WMM/run-5/checkpoint-267", "epoch": 1.0, "eval_steps": 500, "global_step": 267, "is_hyper_param_search": true, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7338028169014085, "eval_loss": 0.6466411352157593, "eval_runtime": 2.0904, "eval_samples_per_second": 1018.923, "eval_steps_per_second": 64.101, "step": 267 } ], "logging_steps": 500, "max_steps": 534, "num_input_tokens_seen": 0, "num_train_epochs": 2, "save_steps": 500, "total_flos": 0, "train_batch_size": 32, "trial_name": null, "trial_params": { "learning_rate": 8.887574420426101e-06, "num_train_epochs": 2, "per_device_train_batch_size": 32, "weight_decay": 1.6818908255902827e-05 } }