File size: 4,818 Bytes
1232351 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 |
{
"best_metric": 0.863960065934798,
"best_model_checkpoint": "tmp_ner_fantastic-bale-09_44/run-61/checkpoint-675",
"epoch": 9.0,
"eval_steps": 500,
"global_step": 675,
"is_hyper_param_search": true,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.9783235867446394,
"eval_loss": 0.06952951103448868,
"eval_macro_f1": 0.6359234331864915,
"eval_macro_precision": 0.8484880913225343,
"eval_macro_recall": 0.621665816946364,
"eval_runtime": 0.6216,
"eval_samples_per_second": 160.873,
"eval_steps_per_second": 20.913,
"step": 75
},
{
"epoch": 2.0,
"eval_accuracy": 0.983391812865497,
"eval_loss": 0.056511040776968,
"eval_macro_f1": 0.7614548378523822,
"eval_macro_precision": 0.8731710257534685,
"eval_macro_recall": 0.7203600182300229,
"eval_runtime": 0.6015,
"eval_samples_per_second": 166.249,
"eval_steps_per_second": 21.612,
"step": 150
},
{
"epoch": 3.0,
"eval_accuracy": 0.9857309941520468,
"eval_loss": 0.05191269889473915,
"eval_macro_f1": 0.8172545857097553,
"eval_macro_precision": 0.8413749539052772,
"eval_macro_recall": 0.7970101814719535,
"eval_runtime": 0.6777,
"eval_samples_per_second": 147.557,
"eval_steps_per_second": 19.182,
"step": 225
},
{
"epoch": 4.0,
"eval_accuracy": 0.9871734892787525,
"eval_loss": 0.055695317685604095,
"eval_macro_f1": 0.8405769067306196,
"eval_macro_precision": 0.8557959065634769,
"eval_macro_recall": 0.8269452880439045,
"eval_runtime": 0.6377,
"eval_samples_per_second": 156.826,
"eval_steps_per_second": 20.387,
"step": 300
},
{
"epoch": 5.0,
"eval_accuracy": 0.9875243664717349,
"eval_loss": 0.055003080517053604,
"eval_macro_f1": 0.8540405601187896,
"eval_macro_precision": 0.8983484203175353,
"eval_macro_recall": 0.8221656291922347,
"eval_runtime": 0.6394,
"eval_samples_per_second": 156.406,
"eval_steps_per_second": 20.333,
"step": 375
},
{
"epoch": 6.0,
"eval_accuracy": 0.9878362573099415,
"eval_loss": 0.060502711683511734,
"eval_macro_f1": 0.8610460620824656,
"eval_macro_precision": 0.8865353357904526,
"eval_macro_recall": 0.8387695106889209,
"eval_runtime": 0.6171,
"eval_samples_per_second": 162.056,
"eval_steps_per_second": 21.067,
"step": 450
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.02602095529437065,
"learning_rate": 3.3881089787380476e-05,
"loss": 0.08,
"step": 500
},
{
"epoch": 7.0,
"eval_accuracy": 0.9864327485380117,
"eval_loss": 0.06403131783008575,
"eval_macro_f1": 0.836324040811885,
"eval_macro_precision": 0.8309543877948833,
"eval_macro_recall": 0.8430665699031182,
"eval_runtime": 0.6657,
"eval_samples_per_second": 150.212,
"eval_steps_per_second": 19.528,
"step": 525
},
{
"epoch": 8.0,
"eval_accuracy": 0.9874463937621832,
"eval_loss": 0.06809797883033752,
"eval_macro_f1": 0.853127015308474,
"eval_macro_precision": 0.871470843170948,
"eval_macro_recall": 0.8370896203600997,
"eval_runtime": 0.6629,
"eval_samples_per_second": 150.862,
"eval_steps_per_second": 19.612,
"step": 600
},
{
"epoch": 9.0,
"eval_accuracy": 0.9883040935672515,
"eval_loss": 0.06698578596115112,
"eval_macro_f1": 0.863960065934798,
"eval_macro_precision": 0.8939098518285944,
"eval_macro_recall": 0.8388049073611367,
"eval_runtime": 0.6334,
"eval_samples_per_second": 157.89,
"eval_steps_per_second": 20.526,
"step": 675
}
],
"logging_steps": 500,
"max_steps": 2400,
"num_input_tokens_seen": 0,
"num_train_epochs": 32,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 3,
"early_stopping_threshold": 0.001
},
"attributes": {
"early_stopping_patience_counter": 0
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 768333841626390.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": {
"learning_rate": 4.2369194386745274e-05,
"per_device_train_batch_size": 8,
"warmup_ratio": 0.009641097927077978,
"weight_decay": 0.11095292966544487
}
}
|