|
{ |
|
"best_metric": 0.8626177714583143, |
|
"best_model_checkpoint": "result/my-sup-simcse-bert-base-uncased/SupCon-28-100.0-3e-6-0.05-0.00", |
|
"epoch": 2.9953703703703702, |
|
"global_step": 645, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.58, |
|
"eval_avg_sts": 0.834701718312026, |
|
"eval_sickr_spearman": 0.817920809860896, |
|
"eval_stsb_spearman": 0.851482626763156, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"eval_avg_sts": 0.8365837614673681, |
|
"eval_sickr_spearman": 0.8167967379939398, |
|
"eval_stsb_spearman": 0.8563707849407965, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 1.74, |
|
"eval_avg_sts": 0.8407075744602279, |
|
"eval_sickr_spearman": 0.8187973774621414, |
|
"eval_stsb_spearman": 0.8626177714583143, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 2.32, |
|
"learning_rate": 1.1419753086419753e-05, |
|
"loss": 0.7185, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.32, |
|
"eval_avg_sts": 0.8370980558240873, |
|
"eval_sickr_spearman": 0.812430662842114, |
|
"eval_stsb_spearman": 0.8617654488060604, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.9, |
|
"eval_avg_sts": 0.8378817327123782, |
|
"eval_sickr_spearman": 0.814155075445945, |
|
"eval_stsb_spearman": 0.8616083899788114, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"step": 645, |
|
"total_flos": 52908914324275200, |
|
"train_runtime": 863.9621, |
|
"train_samples_per_second": 0.75 |
|
} |
|
], |
|
"max_steps": 648, |
|
"num_train_epochs": 3, |
|
"total_flos": 52908914324275200, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|