bioner_bc5cdr / trainer_state.json
jakelever's picture
Upload folder using huggingface_hub
6eaba08 verified
{
"best_metric": 0.9321585507595793,
"best_model_checkpoint": "tmp_ner_fantastic-bale-10_45/run-33/checkpoint-875",
"epoch": 7.0,
"eval_steps": 500,
"global_step": 875,
"is_hyper_param_search": true,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.9730935342517575,
"eval_loss": 0.08587262034416199,
"eval_macro_f1": 0.9170047043200686,
"eval_macro_precision": 0.9278276425309375,
"eval_macro_recall": 0.90752738549263,
"eval_runtime": 5.7832,
"eval_samples_per_second": 172.914,
"eval_steps_per_second": 21.614,
"step": 125
},
{
"epoch": 2.0,
"eval_accuracy": 0.9750480754074587,
"eval_loss": 0.08141306042671204,
"eval_macro_f1": 0.9264657139223695,
"eval_macro_precision": 0.9157927892781152,
"eval_macro_recall": 0.9377952332788448,
"eval_runtime": 6.0324,
"eval_samples_per_second": 165.773,
"eval_steps_per_second": 20.722,
"step": 250
},
{
"epoch": 3.0,
"eval_accuracy": 0.9743781721887709,
"eval_loss": 0.08608711510896683,
"eval_macro_f1": 0.9247086477797719,
"eval_macro_precision": 0.9173611315562689,
"eval_macro_recall": 0.933305032585042,
"eval_runtime": 6.0132,
"eval_samples_per_second": 166.3,
"eval_steps_per_second": 20.787,
"step": 375
},
{
"epoch": 4.0,
"grad_norm": 0.6703500151634216,
"learning_rate": 5.4624258845588244e-05,
"loss": 0.1282,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.9770420226348476,
"eval_loss": 0.09856158494949341,
"eval_macro_f1": 0.9314150814858593,
"eval_macro_precision": 0.9211465798788551,
"eval_macro_recall": 0.9421883284262093,
"eval_runtime": 5.932,
"eval_samples_per_second": 168.577,
"eval_steps_per_second": 21.072,
"step": 500
},
{
"epoch": 5.0,
"eval_accuracy": 0.9750086693357712,
"eval_loss": 0.11021321266889572,
"eval_macro_f1": 0.9267488028708639,
"eval_macro_precision": 0.9153942226603791,
"eval_macro_recall": 0.9386080517042859,
"eval_runtime": 5.9689,
"eval_samples_per_second": 167.536,
"eval_steps_per_second": 20.942,
"step": 625
},
{
"epoch": 6.0,
"eval_accuracy": 0.9760253459853094,
"eval_loss": 0.11098870635032654,
"eval_macro_f1": 0.9287954097228024,
"eval_macro_precision": 0.9205523043756338,
"eval_macro_recall": 0.9374208211553338,
"eval_runtime": 5.9208,
"eval_samples_per_second": 168.896,
"eval_steps_per_second": 21.112,
"step": 750
},
{
"epoch": 7.0,
"eval_accuracy": 0.9773021027079852,
"eval_loss": 0.11490638554096222,
"eval_macro_f1": 0.9321585507595793,
"eval_macro_precision": 0.9266098427277691,
"eval_macro_recall": 0.9378807443139501,
"eval_runtime": 6.075,
"eval_samples_per_second": 164.61,
"eval_steps_per_second": 20.576,
"step": 875
}
],
"logging_steps": 500,
"max_steps": 4000,
"num_input_tokens_seen": 0,
"num_train_epochs": 32,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 3,
"early_stopping_threshold": 0.001
},
"attributes": {
"early_stopping_patience_counter": 3
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 723885139142880.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": {
"learning_rate": 6.150691546013236e-05,
"per_device_train_batch_size": 8,
"warmup_ratio": 0.014555287490025246,
"weight_decay": 0.02919246813677108
}
}