|
{
|
|
"best_metric": 0.734091493336525,
|
|
"best_model_checkpoint": "dccuchile/bert-base-spanish-wwm-cased-finetuned-agm-17\\checkpoint-1134",
|
|
"epoch": 17.0,
|
|
"global_step": 2754,
|
|
"is_hyper_param_search": false,
|
|
"is_local_process_zero": true,
|
|
"is_world_process_zero": true,
|
|
"log_history": [
|
|
{
|
|
"epoch": 1.0,
|
|
"eval_accuracy": 0.6146788990825688,
|
|
"eval_balanced_accuracy": 0.5496493170911775,
|
|
"eval_f1": 0.5802121406999178,
|
|
"eval_loss": 0.8864156603813171,
|
|
"eval_matthews_corr": 0.39264781381473346,
|
|
"eval_runtime": 0.9448,
|
|
"eval_samples_per_second": 115.366,
|
|
"eval_steps_per_second": 29.635,
|
|
"step": 162
|
|
},
|
|
{
|
|
"epoch": 2.0,
|
|
"eval_accuracy": 0.6605504587155964,
|
|
"eval_balanced_accuracy": 0.6356589147286821,
|
|
"eval_f1": 0.6507029674865616,
|
|
"eval_loss": 1.221592903137207,
|
|
"eval_matthews_corr": 0.49655588625297953,
|
|
"eval_runtime": 0.9703,
|
|
"eval_samples_per_second": 112.333,
|
|
"eval_steps_per_second": 28.856,
|
|
"step": 324
|
|
},
|
|
{
|
|
"epoch": 3.0,
|
|
"eval_accuracy": 0.6972477064220184,
|
|
"eval_balanced_accuracy": 0.6861849390919158,
|
|
"eval_f1": 0.6963201171916769,
|
|
"eval_loss": 1.493444561958313,
|
|
"eval_matthews_corr": 0.5327691486032612,
|
|
"eval_runtime": 0.9853,
|
|
"eval_samples_per_second": 110.622,
|
|
"eval_steps_per_second": 28.417,
|
|
"step": 486
|
|
},
|
|
{
|
|
"epoch": 3.09,
|
|
"learning_rate": 1.9382716049382716e-05,
|
|
"loss": 0.6321,
|
|
"step": 500
|
|
},
|
|
{
|
|
"epoch": 4.0,
|
|
"eval_accuracy": 0.6330275229357798,
|
|
"eval_balanced_accuracy": 0.5891472868217055,
|
|
"eval_f1": 0.6237818038867272,
|
|
"eval_loss": 2.305826425552368,
|
|
"eval_matthews_corr": 0.42950850046817396,
|
|
"eval_runtime": 0.9899,
|
|
"eval_samples_per_second": 110.115,
|
|
"eval_steps_per_second": 28.286,
|
|
"step": 648
|
|
},
|
|
{
|
|
"epoch": 5.0,
|
|
"eval_accuracy": 0.7155963302752294,
|
|
"eval_balanced_accuracy": 0.6784330011074197,
|
|
"eval_f1": 0.7083841635992166,
|
|
"eval_loss": 2.0942306518554688,
|
|
"eval_matthews_corr": 0.5558220202942262,
|
|
"eval_runtime": 1.0146,
|
|
"eval_samples_per_second": 107.432,
|
|
"eval_steps_per_second": 27.597,
|
|
"step": 810
|
|
},
|
|
{
|
|
"epoch": 6.0,
|
|
"eval_accuracy": 0.6972477064220184,
|
|
"eval_balanced_accuracy": 0.6861849390919158,
|
|
"eval_f1": 0.6961474988021934,
|
|
"eval_loss": 2.0568454265594482,
|
|
"eval_matthews_corr": 0.5347932844649809,
|
|
"eval_runtime": 1.0033,
|
|
"eval_samples_per_second": 108.642,
|
|
"eval_steps_per_second": 27.908,
|
|
"step": 972
|
|
},
|
|
{
|
|
"epoch": 6.17,
|
|
"learning_rate": 1.8765432098765433e-05,
|
|
"loss": 0.0821,
|
|
"step": 1000
|
|
},
|
|
{
|
|
"epoch": 7.0,
|
|
"eval_accuracy": 0.7339449541284404,
|
|
"eval_balanced_accuracy": 0.7305740125507567,
|
|
"eval_f1": 0.734091493336525,
|
|
"eval_loss": 1.9095344543457031,
|
|
"eval_matthews_corr": 0.5921023400775965,
|
|
"eval_runtime": 1.0123,
|
|
"eval_samples_per_second": 107.676,
|
|
"eval_steps_per_second": 27.66,
|
|
"step": 1134
|
|
},
|
|
{
|
|
"epoch": 8.0,
|
|
"eval_accuracy": 0.6972477064220184,
|
|
"eval_balanced_accuracy": 0.7045957918050941,
|
|
"eval_f1": 0.6974540186265638,
|
|
"eval_loss": 2.486194372177124,
|
|
"eval_matthews_corr": 0.5398860870112605,
|
|
"eval_runtime": 0.9899,
|
|
"eval_samples_per_second": 110.11,
|
|
"eval_steps_per_second": 28.285,
|
|
"step": 1296
|
|
},
|
|
{
|
|
"epoch": 9.0,
|
|
"eval_accuracy": 0.6880733944954128,
|
|
"eval_balanced_accuracy": 0.6782484311554079,
|
|
"eval_f1": 0.6864400889630247,
|
|
"eval_loss": 2.647495746612549,
|
|
"eval_matthews_corr": 0.5182982198223602,
|
|
"eval_runtime": 0.9899,
|
|
"eval_samples_per_second": 110.111,
|
|
"eval_steps_per_second": 28.285,
|
|
"step": 1458
|
|
},
|
|
{
|
|
"epoch": 9.26,
|
|
"learning_rate": 1.814814814814815e-05,
|
|
"loss": 0.0135,
|
|
"step": 1500
|
|
},
|
|
{
|
|
"epoch": 10.0,
|
|
"eval_accuracy": 0.6605504587155964,
|
|
"eval_balanced_accuracy": 0.6484865263935031,
|
|
"eval_f1": 0.657183720633772,
|
|
"eval_loss": 2.9095847606658936,
|
|
"eval_matthews_corr": 0.47901280675974883,
|
|
"eval_runtime": 1.0213,
|
|
"eval_samples_per_second": 106.73,
|
|
"eval_steps_per_second": 27.417,
|
|
"step": 1620
|
|
},
|
|
{
|
|
"epoch": 11.0,
|
|
"eval_accuracy": 0.6788990825688074,
|
|
"eval_balanced_accuracy": 0.6703119232189,
|
|
"eval_f1": 0.676130818235054,
|
|
"eval_loss": 2.872298240661621,
|
|
"eval_matthews_corr": 0.5061412972412488,
|
|
"eval_runtime": 0.9822,
|
|
"eval_samples_per_second": 110.977,
|
|
"eval_steps_per_second": 28.508,
|
|
"step": 1782
|
|
},
|
|
{
|
|
"epoch": 12.0,
|
|
"eval_accuracy": 0.6880733944954128,
|
|
"eval_balanced_accuracy": 0.6782484311554079,
|
|
"eval_f1": 0.6858583201079531,
|
|
"eval_loss": 2.9195542335510254,
|
|
"eval_matthews_corr": 0.5189987961354203,
|
|
"eval_runtime": 0.986,
|
|
"eval_samples_per_second": 110.548,
|
|
"eval_steps_per_second": 28.398,
|
|
"step": 1944
|
|
},
|
|
{
|
|
"epoch": 12.35,
|
|
"learning_rate": 1.7530864197530865e-05,
|
|
"loss": 0.0036,
|
|
"step": 2000
|
|
},
|
|
{
|
|
"epoch": 13.0,
|
|
"eval_accuracy": 0.6880733944954128,
|
|
"eval_balanced_accuracy": 0.6782484311554079,
|
|
"eval_f1": 0.6858583201079531,
|
|
"eval_loss": 2.9513614177703857,
|
|
"eval_matthews_corr": 0.5189987961354203,
|
|
"eval_runtime": 0.9892,
|
|
"eval_samples_per_second": 110.19,
|
|
"eval_steps_per_second": 28.306,
|
|
"step": 2106
|
|
},
|
|
{
|
|
"epoch": 14.0,
|
|
"eval_accuracy": 0.6788990825688074,
|
|
"eval_balanced_accuracy": 0.6703119232189,
|
|
"eval_f1": 0.676130818235054,
|
|
"eval_loss": 3.039541006088257,
|
|
"eval_matthews_corr": 0.5061412972412488,
|
|
"eval_runtime": 0.9838,
|
|
"eval_samples_per_second": 110.798,
|
|
"eval_steps_per_second": 28.462,
|
|
"step": 2268
|
|
},
|
|
{
|
|
"epoch": 15.0,
|
|
"eval_accuracy": 0.6788990825688074,
|
|
"eval_balanced_accuracy": 0.664359542266519,
|
|
"eval_f1": 0.6764317486794551,
|
|
"eval_loss": 3.0635788440704346,
|
|
"eval_matthews_corr": 0.5038272910414593,
|
|
"eval_runtime": 0.9927,
|
|
"eval_samples_per_second": 109.797,
|
|
"eval_steps_per_second": 28.205,
|
|
"step": 2430
|
|
},
|
|
{
|
|
"epoch": 15.43,
|
|
"learning_rate": 1.6913580246913582e-05,
|
|
"loss": 0.0001,
|
|
"step": 2500
|
|
},
|
|
{
|
|
"epoch": 16.0,
|
|
"eval_accuracy": 0.6788990825688074,
|
|
"eval_balanced_accuracy": 0.664359542266519,
|
|
"eval_f1": 0.6764317486794551,
|
|
"eval_loss": 3.103422164916992,
|
|
"eval_matthews_corr": 0.5038272910414593,
|
|
"eval_runtime": 0.989,
|
|
"eval_samples_per_second": 110.21,
|
|
"eval_steps_per_second": 28.311,
|
|
"step": 2592
|
|
},
|
|
{
|
|
"epoch": 17.0,
|
|
"eval_accuracy": 0.6788990825688074,
|
|
"eval_balanced_accuracy": 0.664359542266519,
|
|
"eval_f1": 0.6764317486794551,
|
|
"eval_loss": 3.1538658142089844,
|
|
"eval_matthews_corr": 0.5038272910414593,
|
|
"eval_runtime": 0.9887,
|
|
"eval_samples_per_second": 110.246,
|
|
"eval_steps_per_second": 28.32,
|
|
"step": 2754
|
|
}
|
|
],
|
|
"max_steps": 16200,
|
|
"num_train_epochs": 100,
|
|
"total_flos": 1222786719713664.0,
|
|
"trial_name": null,
|
|
"trial_params": null
|
|
}
|
|
|