Md Mushfiqur Rahman
Upload with huggingface_hub
a15dae3
{
"best_metric": 14.889152449594015,
"best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/bert/bert-base-finetuned-parsing-ud-Coptic-Scriptorium/checkpoint-500",
"epoch": 76.92307692307692,
"global_step": 3000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 2.56,
"learning_rate": 7.6e-05,
"loss": 5.3836,
"step": 100
},
{
"epoch": 5.13,
"learning_rate": 7.948993288590604e-05,
"loss": 4.1364,
"step": 200
},
{
"epoch": 7.69,
"learning_rate": 7.895302013422819e-05,
"loss": 3.8943,
"step": 300
},
{
"epoch": 10.26,
"learning_rate": 7.841610738255034e-05,
"loss": 3.7384,
"step": 400
},
{
"epoch": 12.82,
"learning_rate": 7.787919463087249e-05,
"loss": 3.5767,
"step": 500
},
{
"epoch": 12.82,
"eval_las": 14.889152449594015,
"eval_loss": 4.103353500366211,
"eval_runtime": 2.9493,
"eval_samples_per_second": 129.182,
"eval_steps_per_second": 16.275,
"eval_uas": 31.748928017516647,
"step": 500
},
{
"epoch": 15.38,
"learning_rate": 7.734228187919463e-05,
"loss": 3.4084,
"step": 600
},
{
"epoch": 17.95,
"learning_rate": 7.680536912751678e-05,
"loss": 3.2001,
"step": 700
},
{
"epoch": 20.51,
"learning_rate": 7.626845637583893e-05,
"loss": 2.9538,
"step": 800
},
{
"epoch": 23.08,
"learning_rate": 7.573154362416108e-05,
"loss": 2.7223,
"step": 900
},
{
"epoch": 25.64,
"learning_rate": 7.519463087248323e-05,
"loss": 2.4472,
"step": 1000
},
{
"epoch": 25.64,
"eval_las": 11.248973633792538,
"eval_loss": 5.691993713378906,
"eval_runtime": 2.9489,
"eval_samples_per_second": 129.203,
"eval_steps_per_second": 16.278,
"eval_uas": 27.926284098166228,
"step": 1000
},
{
"epoch": 28.21,
"learning_rate": 7.465771812080537e-05,
"loss": 2.2519,
"step": 1100
},
{
"epoch": 30.77,
"learning_rate": 7.412080536912752e-05,
"loss": 2.0317,
"step": 1200
},
{
"epoch": 33.33,
"learning_rate": 7.358389261744967e-05,
"loss": 1.8544,
"step": 1300
},
{
"epoch": 35.9,
"learning_rate": 7.304697986577182e-05,
"loss": 1.7134,
"step": 1400
},
{
"epoch": 38.46,
"learning_rate": 7.251006711409397e-05,
"loss": 1.5671,
"step": 1500
},
{
"epoch": 38.46,
"eval_las": 9.871362101997994,
"eval_loss": 7.934547424316406,
"eval_runtime": 2.9464,
"eval_samples_per_second": 129.311,
"eval_steps_per_second": 16.291,
"eval_uas": 25.444758689900553,
"step": 1500
},
{
"epoch": 41.03,
"learning_rate": 7.197315436241612e-05,
"loss": 1.4647,
"step": 1600
},
{
"epoch": 43.59,
"learning_rate": 7.143624161073826e-05,
"loss": 1.3584,
"step": 1700
},
{
"epoch": 46.15,
"learning_rate": 7.089932885906041e-05,
"loss": 1.2918,
"step": 1800
},
{
"epoch": 48.72,
"learning_rate": 7.036241610738256e-05,
"loss": 1.2333,
"step": 1900
},
{
"epoch": 51.28,
"learning_rate": 6.982550335570471e-05,
"loss": 1.2108,
"step": 2000
},
{
"epoch": 51.28,
"eval_las": 9.570294681142231,
"eval_loss": 10.208051681518555,
"eval_runtime": 2.9507,
"eval_samples_per_second": 129.123,
"eval_steps_per_second": 16.267,
"eval_uas": 24.58717270322051,
"step": 2000
},
{
"epoch": 53.85,
"learning_rate": 6.928859060402686e-05,
"loss": 1.1363,
"step": 2100
},
{
"epoch": 56.41,
"learning_rate": 6.8751677852349e-05,
"loss": 1.1452,
"step": 2200
},
{
"epoch": 58.97,
"learning_rate": 6.821476510067115e-05,
"loss": 1.0937,
"step": 2300
},
{
"epoch": 61.54,
"learning_rate": 6.76778523489933e-05,
"loss": 1.0555,
"step": 2400
},
{
"epoch": 64.1,
"learning_rate": 6.714093959731544e-05,
"loss": 1.0311,
"step": 2500
},
{
"epoch": 64.1,
"eval_las": 9.707143508803942,
"eval_loss": 11.06482219696045,
"eval_runtime": 2.9481,
"eval_samples_per_second": 129.236,
"eval_steps_per_second": 16.282,
"eval_uas": 24.368214578961776,
"step": 2500
},
{
"epoch": 66.67,
"learning_rate": 6.660402684563758e-05,
"loss": 1.0068,
"step": 2600
},
{
"epoch": 69.23,
"learning_rate": 6.606711409395973e-05,
"loss": 1.0095,
"step": 2700
},
{
"epoch": 71.79,
"learning_rate": 6.553020134228188e-05,
"loss": 0.9792,
"step": 2800
},
{
"epoch": 74.36,
"learning_rate": 6.499328859060403e-05,
"loss": 0.988,
"step": 2900
},
{
"epoch": 76.92,
"learning_rate": 6.445637583892618e-05,
"loss": 0.9661,
"step": 3000
},
{
"epoch": 76.92,
"eval_las": 9.670650488094152,
"eval_loss": 10.523516654968262,
"eval_runtime": 2.9465,
"eval_samples_per_second": 129.304,
"eval_steps_per_second": 16.29,
"eval_uas": 24.41383085484901,
"step": 3000
},
{
"epoch": 76.92,
"step": 3000,
"total_flos": 1.5763284763250688e+16,
"train_loss": 2.0616751454671225,
"train_runtime": 1642.7036,
"train_samples_per_second": 292.201,
"train_steps_per_second": 9.131
}
],
"max_steps": 15000,
"num_train_epochs": 385,
"total_flos": 1.5763284763250688e+16,
"trial_name": null,
"trial_params": null
}