|
{ |
|
"best_metric": 0.9321585507595793, |
|
"best_model_checkpoint": "tmp_ner_fantastic-bale-10_45/run-33/checkpoint-875", |
|
"epoch": 7.0, |
|
"eval_steps": 500, |
|
"global_step": 875, |
|
"is_hyper_param_search": true, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9730935342517575, |
|
"eval_loss": 0.08587262034416199, |
|
"eval_macro_f1": 0.9170047043200686, |
|
"eval_macro_precision": 0.9278276425309375, |
|
"eval_macro_recall": 0.90752738549263, |
|
"eval_runtime": 5.7832, |
|
"eval_samples_per_second": 172.914, |
|
"eval_steps_per_second": 21.614, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.9750480754074587, |
|
"eval_loss": 0.08141306042671204, |
|
"eval_macro_f1": 0.9264657139223695, |
|
"eval_macro_precision": 0.9157927892781152, |
|
"eval_macro_recall": 0.9377952332788448, |
|
"eval_runtime": 6.0324, |
|
"eval_samples_per_second": 165.773, |
|
"eval_steps_per_second": 20.722, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9743781721887709, |
|
"eval_loss": 0.08608711510896683, |
|
"eval_macro_f1": 0.9247086477797719, |
|
"eval_macro_precision": 0.9173611315562689, |
|
"eval_macro_recall": 0.933305032585042, |
|
"eval_runtime": 6.0132, |
|
"eval_samples_per_second": 166.3, |
|
"eval_steps_per_second": 20.787, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 0.6703500151634216, |
|
"learning_rate": 5.4624258845588244e-05, |
|
"loss": 0.1282, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9770420226348476, |
|
"eval_loss": 0.09856158494949341, |
|
"eval_macro_f1": 0.9314150814858593, |
|
"eval_macro_precision": 0.9211465798788551, |
|
"eval_macro_recall": 0.9421883284262093, |
|
"eval_runtime": 5.932, |
|
"eval_samples_per_second": 168.577, |
|
"eval_steps_per_second": 21.072, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9750086693357712, |
|
"eval_loss": 0.11021321266889572, |
|
"eval_macro_f1": 0.9267488028708639, |
|
"eval_macro_precision": 0.9153942226603791, |
|
"eval_macro_recall": 0.9386080517042859, |
|
"eval_runtime": 5.9689, |
|
"eval_samples_per_second": 167.536, |
|
"eval_steps_per_second": 20.942, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9760253459853094, |
|
"eval_loss": 0.11098870635032654, |
|
"eval_macro_f1": 0.9287954097228024, |
|
"eval_macro_precision": 0.9205523043756338, |
|
"eval_macro_recall": 0.9374208211553338, |
|
"eval_runtime": 5.9208, |
|
"eval_samples_per_second": 168.896, |
|
"eval_steps_per_second": 21.112, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9773021027079852, |
|
"eval_loss": 0.11490638554096222, |
|
"eval_macro_f1": 0.9321585507595793, |
|
"eval_macro_precision": 0.9266098427277691, |
|
"eval_macro_recall": 0.9378807443139501, |
|
"eval_runtime": 6.075, |
|
"eval_samples_per_second": 164.61, |
|
"eval_steps_per_second": 20.576, |
|
"step": 875 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4000, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 32, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"EarlyStoppingCallback": { |
|
"args": { |
|
"early_stopping_patience": 3, |
|
"early_stopping_threshold": 0.001 |
|
}, |
|
"attributes": { |
|
"early_stopping_patience_counter": 3 |
|
} |
|
}, |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 723885139142880.0, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": { |
|
"learning_rate": 6.150691546013236e-05, |
|
"per_device_train_batch_size": 8, |
|
"warmup_ratio": 0.014555287490025246, |
|
"weight_decay": 0.02919246813677108 |
|
} |
|
} |
|
|