File size: 1,956 Bytes
b4529a5 4b62f7f 04f2323 4b62f7f b4529a5 04f2323 4b62f7f b4529a5 4b62f7f b4529a5 04f2323 4b62f7f b4529a5 b9e55ce 04f2323 4b62f7f b9e55ce 4b62f7f b9e55ce 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 4b62f7f 04f2323 b4529a5 04f2323 b4529a5 04f2323 d8da5d6 b4529a5 4b62f7f b4529a5 4b62f7f b4529a5 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.021052631578947368,
"eval_steps": 3,
"global_step": 5,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.004210526315789474,
"grad_norm": 6.040051460266113,
"learning_rate": 2e-05,
"loss": 5.2097,
"step": 1
},
{
"epoch": 0.004210526315789474,
"eval_loss": 5.1479387283325195,
"eval_runtime": 33.4641,
"eval_samples_per_second": 2.988,
"eval_steps_per_second": 1.494,
"step": 1
},
{
"epoch": 0.008421052631578947,
"grad_norm": 6.306079387664795,
"learning_rate": 4e-05,
"loss": 5.1825,
"step": 2
},
{
"epoch": 0.01263157894736842,
"grad_norm": 6.255680561065674,
"learning_rate": 6e-05,
"loss": 5.2103,
"step": 3
},
{
"epoch": 0.01263157894736842,
"eval_loss": 5.074653625488281,
"eval_runtime": 33.571,
"eval_samples_per_second": 2.979,
"eval_steps_per_second": 1.489,
"step": 3
},
{
"epoch": 0.016842105263157894,
"grad_norm": 6.213514804840088,
"learning_rate": 8e-05,
"loss": 5.0592,
"step": 4
},
{
"epoch": 0.021052631578947368,
"grad_norm": 6.902180194854736,
"learning_rate": 0.0001,
"loss": 4.7818,
"step": 5
}
],
"logging_steps": 1,
"max_steps": 10,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 5,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 2818744422236160.0,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|