lu-vae's picture
Upload folder using huggingface_hub
e52c1e9 verified
{
"best_metric": 0.84512111394795,
"best_model_checkpoint": "./save_models/mrpc/roberta-base_lr1e-05/checkpoint-117",
"epoch": 10.0,
"eval_steps": 500,
"global_step": 130,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6839237057220708,
"eval_averaged_scores": 0.7481107201749513,
"eval_f1": 0.8122977346278317,
"eval_loss": 0.6196000576019287,
"eval_runtime": 0.9135,
"eval_samples_per_second": 401.752,
"eval_steps_per_second": 2.189,
"step": 13
},
{
"epoch": 2.0,
"eval_accuracy": 0.6839237057220708,
"eval_averaged_scores": 0.7481107201749513,
"eval_f1": 0.8122977346278317,
"eval_loss": 0.5717987418174744,
"eval_runtime": 0.9146,
"eval_samples_per_second": 401.283,
"eval_steps_per_second": 2.187,
"step": 26
},
{
"epoch": 3.0,
"eval_accuracy": 0.7084468664850136,
"eval_averaged_scores": 0.7630820363089463,
"eval_f1": 0.8177172061328791,
"eval_loss": 0.5101604461669922,
"eval_runtime": 0.9281,
"eval_samples_per_second": 395.44,
"eval_steps_per_second": 2.155,
"step": 39
},
{
"epoch": 4.0,
"eval_accuracy": 0.7956403269754768,
"eval_averaged_scores": 0.8287593900070754,
"eval_f1": 0.861878453038674,
"eval_loss": 0.45689526200294495,
"eval_runtime": 0.9188,
"eval_samples_per_second": 399.445,
"eval_steps_per_second": 2.177,
"step": 52
},
{
"epoch": 5.0,
"eval_accuracy": 0.771117166212534,
"eval_averaged_scores": 0.7961968809786075,
"eval_f1": 0.8212765957446809,
"eval_loss": 0.42808404564857483,
"eval_runtime": 0.9515,
"eval_samples_per_second": 385.719,
"eval_steps_per_second": 2.102,
"step": 65
},
{
"epoch": 6.0,
"eval_accuracy": 0.8092643051771117,
"eval_averaged_scores": 0.8343510280905638,
"eval_f1": 0.859437751004016,
"eval_loss": 0.4162532687187195,
"eval_runtime": 0.9128,
"eval_samples_per_second": 402.06,
"eval_steps_per_second": 2.191,
"step": 78
},
{
"epoch": 7.0,
"eval_accuracy": 0.8147138964577657,
"eval_averaged_scores": 0.8396278645635442,
"eval_f1": 0.8645418326693227,
"eval_loss": 0.41786280274391174,
"eval_runtime": 1.0619,
"eval_samples_per_second": 345.592,
"eval_steps_per_second": 1.883,
"step": 91
},
{
"epoch": 8.0,
"eval_accuracy": 0.8065395095367848,
"eval_averaged_scores": 0.8318411833398209,
"eval_f1": 0.8571428571428572,
"eval_loss": 0.4168005883693695,
"eval_runtime": 0.9219,
"eval_samples_per_second": 398.082,
"eval_steps_per_second": 2.169,
"step": 104
},
{
"epoch": 9.0,
"eval_accuracy": 0.8201634877384196,
"eval_averaged_scores": 0.84512111394795,
"eval_f1": 0.8700787401574802,
"eval_loss": 0.42427295446395874,
"eval_runtime": 0.9217,
"eval_samples_per_second": 398.165,
"eval_steps_per_second": 2.17,
"step": 117
},
{
"epoch": 10.0,
"eval_accuracy": 0.8119891008174387,
"eval_averaged_scores": 0.8374060812238286,
"eval_f1": 0.8628230616302187,
"eval_loss": 0.42201152443885803,
"eval_runtime": 0.9117,
"eval_samples_per_second": 402.525,
"eval_steps_per_second": 2.194,
"step": 130
},
{
"epoch": 10.0,
"step": 130,
"total_flos": 1559281933489620.0,
"train_loss": 0.44359661982609677,
"train_runtime": 101.3918,
"train_samples_per_second": 325.569,
"train_steps_per_second": 1.282
}
],
"logging_steps": 500,
"max_steps": 130,
"num_input_tokens_seen": 0,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 1559281933489620.0,
"train_batch_size": 256,
"trial_name": null,
"trial_params": null
}