spanish-social-media-boxing-text / trainer_state.json
lzun's picture
Upload 7 files
741cec0 verified
{
"best_metric": 0.734091493336525,
"best_model_checkpoint": "dccuchile/bert-base-spanish-wwm-cased-finetuned-agm-17\\checkpoint-1134",
"epoch": 17.0,
"global_step": 2754,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6146788990825688,
"eval_balanced_accuracy": 0.5496493170911775,
"eval_f1": 0.5802121406999178,
"eval_loss": 0.8864156603813171,
"eval_matthews_corr": 0.39264781381473346,
"eval_runtime": 0.9448,
"eval_samples_per_second": 115.366,
"eval_steps_per_second": 29.635,
"step": 162
},
{
"epoch": 2.0,
"eval_accuracy": 0.6605504587155964,
"eval_balanced_accuracy": 0.6356589147286821,
"eval_f1": 0.6507029674865616,
"eval_loss": 1.221592903137207,
"eval_matthews_corr": 0.49655588625297953,
"eval_runtime": 0.9703,
"eval_samples_per_second": 112.333,
"eval_steps_per_second": 28.856,
"step": 324
},
{
"epoch": 3.0,
"eval_accuracy": 0.6972477064220184,
"eval_balanced_accuracy": 0.6861849390919158,
"eval_f1": 0.6963201171916769,
"eval_loss": 1.493444561958313,
"eval_matthews_corr": 0.5327691486032612,
"eval_runtime": 0.9853,
"eval_samples_per_second": 110.622,
"eval_steps_per_second": 28.417,
"step": 486
},
{
"epoch": 3.09,
"learning_rate": 1.9382716049382716e-05,
"loss": 0.6321,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.6330275229357798,
"eval_balanced_accuracy": 0.5891472868217055,
"eval_f1": 0.6237818038867272,
"eval_loss": 2.305826425552368,
"eval_matthews_corr": 0.42950850046817396,
"eval_runtime": 0.9899,
"eval_samples_per_second": 110.115,
"eval_steps_per_second": 28.286,
"step": 648
},
{
"epoch": 5.0,
"eval_accuracy": 0.7155963302752294,
"eval_balanced_accuracy": 0.6784330011074197,
"eval_f1": 0.7083841635992166,
"eval_loss": 2.0942306518554688,
"eval_matthews_corr": 0.5558220202942262,
"eval_runtime": 1.0146,
"eval_samples_per_second": 107.432,
"eval_steps_per_second": 27.597,
"step": 810
},
{
"epoch": 6.0,
"eval_accuracy": 0.6972477064220184,
"eval_balanced_accuracy": 0.6861849390919158,
"eval_f1": 0.6961474988021934,
"eval_loss": 2.0568454265594482,
"eval_matthews_corr": 0.5347932844649809,
"eval_runtime": 1.0033,
"eval_samples_per_second": 108.642,
"eval_steps_per_second": 27.908,
"step": 972
},
{
"epoch": 6.17,
"learning_rate": 1.8765432098765433e-05,
"loss": 0.0821,
"step": 1000
},
{
"epoch": 7.0,
"eval_accuracy": 0.7339449541284404,
"eval_balanced_accuracy": 0.7305740125507567,
"eval_f1": 0.734091493336525,
"eval_loss": 1.9095344543457031,
"eval_matthews_corr": 0.5921023400775965,
"eval_runtime": 1.0123,
"eval_samples_per_second": 107.676,
"eval_steps_per_second": 27.66,
"step": 1134
},
{
"epoch": 8.0,
"eval_accuracy": 0.6972477064220184,
"eval_balanced_accuracy": 0.7045957918050941,
"eval_f1": 0.6974540186265638,
"eval_loss": 2.486194372177124,
"eval_matthews_corr": 0.5398860870112605,
"eval_runtime": 0.9899,
"eval_samples_per_second": 110.11,
"eval_steps_per_second": 28.285,
"step": 1296
},
{
"epoch": 9.0,
"eval_accuracy": 0.6880733944954128,
"eval_balanced_accuracy": 0.6782484311554079,
"eval_f1": 0.6864400889630247,
"eval_loss": 2.647495746612549,
"eval_matthews_corr": 0.5182982198223602,
"eval_runtime": 0.9899,
"eval_samples_per_second": 110.111,
"eval_steps_per_second": 28.285,
"step": 1458
},
{
"epoch": 9.26,
"learning_rate": 1.814814814814815e-05,
"loss": 0.0135,
"step": 1500
},
{
"epoch": 10.0,
"eval_accuracy": 0.6605504587155964,
"eval_balanced_accuracy": 0.6484865263935031,
"eval_f1": 0.657183720633772,
"eval_loss": 2.9095847606658936,
"eval_matthews_corr": 0.47901280675974883,
"eval_runtime": 1.0213,
"eval_samples_per_second": 106.73,
"eval_steps_per_second": 27.417,
"step": 1620
},
{
"epoch": 11.0,
"eval_accuracy": 0.6788990825688074,
"eval_balanced_accuracy": 0.6703119232189,
"eval_f1": 0.676130818235054,
"eval_loss": 2.872298240661621,
"eval_matthews_corr": 0.5061412972412488,
"eval_runtime": 0.9822,
"eval_samples_per_second": 110.977,
"eval_steps_per_second": 28.508,
"step": 1782
},
{
"epoch": 12.0,
"eval_accuracy": 0.6880733944954128,
"eval_balanced_accuracy": 0.6782484311554079,
"eval_f1": 0.6858583201079531,
"eval_loss": 2.9195542335510254,
"eval_matthews_corr": 0.5189987961354203,
"eval_runtime": 0.986,
"eval_samples_per_second": 110.548,
"eval_steps_per_second": 28.398,
"step": 1944
},
{
"epoch": 12.35,
"learning_rate": 1.7530864197530865e-05,
"loss": 0.0036,
"step": 2000
},
{
"epoch": 13.0,
"eval_accuracy": 0.6880733944954128,
"eval_balanced_accuracy": 0.6782484311554079,
"eval_f1": 0.6858583201079531,
"eval_loss": 2.9513614177703857,
"eval_matthews_corr": 0.5189987961354203,
"eval_runtime": 0.9892,
"eval_samples_per_second": 110.19,
"eval_steps_per_second": 28.306,
"step": 2106
},
{
"epoch": 14.0,
"eval_accuracy": 0.6788990825688074,
"eval_balanced_accuracy": 0.6703119232189,
"eval_f1": 0.676130818235054,
"eval_loss": 3.039541006088257,
"eval_matthews_corr": 0.5061412972412488,
"eval_runtime": 0.9838,
"eval_samples_per_second": 110.798,
"eval_steps_per_second": 28.462,
"step": 2268
},
{
"epoch": 15.0,
"eval_accuracy": 0.6788990825688074,
"eval_balanced_accuracy": 0.664359542266519,
"eval_f1": 0.6764317486794551,
"eval_loss": 3.0635788440704346,
"eval_matthews_corr": 0.5038272910414593,
"eval_runtime": 0.9927,
"eval_samples_per_second": 109.797,
"eval_steps_per_second": 28.205,
"step": 2430
},
{
"epoch": 15.43,
"learning_rate": 1.6913580246913582e-05,
"loss": 0.0001,
"step": 2500
},
{
"epoch": 16.0,
"eval_accuracy": 0.6788990825688074,
"eval_balanced_accuracy": 0.664359542266519,
"eval_f1": 0.6764317486794551,
"eval_loss": 3.103422164916992,
"eval_matthews_corr": 0.5038272910414593,
"eval_runtime": 0.989,
"eval_samples_per_second": 110.21,
"eval_steps_per_second": 28.311,
"step": 2592
},
{
"epoch": 17.0,
"eval_accuracy": 0.6788990825688074,
"eval_balanced_accuracy": 0.664359542266519,
"eval_f1": 0.6764317486794551,
"eval_loss": 3.1538658142089844,
"eval_matthews_corr": 0.5038272910414593,
"eval_runtime": 0.9887,
"eval_samples_per_second": 110.246,
"eval_steps_per_second": 28.32,
"step": 2754
}
],
"max_steps": 16200,
"num_train_epochs": 100,
"total_flos": 1222786719713664.0,
"trial_name": null,
"trial_params": null
}