xshubhamx's picture
Upload folder using huggingface_hub
6bca406 verified
{
"best_metric": 0.6460817297487148,
"best_model_checkpoint": "InLegalBERT-lora/checkpoint-2400",
"epoch": 14.930015552099533,
"eval_steps": 500,
"global_step": 2400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.6553059643687065,
"eval_f1_macro": 0.34196434919671853,
"eval_f1_micro": 0.6553059643687065,
"eval_f1_weighted": 0.6146575775654787,
"eval_loss": 1.2012524604797363,
"eval_macro_fpr": 0.036531607457408626,
"eval_macro_sensitivity": 0.39029268516816945,
"eval_macro_specificity": 0.9740627875145957,
"eval_precision": 0.6007307052856502,
"eval_precision_macro": 0.32788772117271575,
"eval_recall": 0.6553059643687065,
"eval_recall_macro": 0.39029268516816945,
"eval_runtime": 30.3344,
"eval_samples_per_second": 42.559,
"eval_steps_per_second": 5.34,
"eval_weighted_fpr": 0.03621124582960371,
"eval_weighted_sensitivity": 0.6553059643687065,
"eval_weighted_specificity": 0.9556358483502301,
"step": 160
},
{
"epoch": 2.0,
"eval_accuracy": 0.7381874515879163,
"eval_f1_macro": 0.4250111578260666,
"eval_f1_micro": 0.7381874515879164,
"eval_f1_weighted": 0.7236865886821344,
"eval_loss": 0.8278939127922058,
"eval_macro_fpr": 0.024763530819684316,
"eval_macro_sensitivity": 0.46578072689552413,
"eval_macro_specificity": 0.9806295017830671,
"eval_precision": 0.7211273477007717,
"eval_precision_macro": 0.40923635739063985,
"eval_recall": 0.7381874515879163,
"eval_recall_macro": 0.46578072689552413,
"eval_runtime": 34.091,
"eval_samples_per_second": 37.869,
"eval_steps_per_second": 4.752,
"eval_weighted_fpr": 0.024707602339181286,
"eval_weighted_sensitivity": 0.7381874515879163,
"eval_weighted_specificity": 0.9712550751580882,
"step": 321
},
{
"epoch": 3.0,
"eval_accuracy": 0.7544539116963594,
"eval_f1_macro": 0.44305220236653187,
"eval_f1_micro": 0.7544539116963594,
"eval_f1_weighted": 0.7304902543811719,
"eval_loss": 0.713018000125885,
"eval_macro_fpr": 0.0233195243156939,
"eval_macro_sensitivity": 0.4769897256873969,
"eval_macro_specificity": 0.9816367201302573,
"eval_precision": 0.7255238407846915,
"eval_precision_macro": 0.4800443784048848,
"eval_recall": 0.7544539116963594,
"eval_recall_macro": 0.4769897256873969,
"eval_runtime": 32.6151,
"eval_samples_per_second": 39.583,
"eval_steps_per_second": 4.967,
"eval_weighted_fpr": 0.02271912850283093,
"eval_weighted_sensitivity": 0.7544539116963594,
"eval_weighted_specificity": 0.9700968902575,
"step": 482
},
{
"epoch": 3.11,
"learning_rate": 3.958333333333333e-05,
"loss": 1.1985,
"step": 500
},
{
"epoch": 4.0,
"eval_accuracy": 0.7823392718822618,
"eval_f1_macro": 0.5047859025633034,
"eval_f1_micro": 0.7823392718822618,
"eval_f1_weighted": 0.766027283346833,
"eval_loss": 0.6922410726547241,
"eval_macro_fpr": 0.02001637486004151,
"eval_macro_sensitivity": 0.528327896933921,
"eval_macro_specificity": 0.9837585704961105,
"eval_precision": 0.7594430092765442,
"eval_precision_macro": 0.5188076394331661,
"eval_recall": 0.7823392718822618,
"eval_recall_macro": 0.528327896933921,
"eval_runtime": 32.5532,
"eval_samples_per_second": 39.658,
"eval_steps_per_second": 4.976,
"eval_weighted_fpr": 0.019485472574717427,
"eval_weighted_sensitivity": 0.7823392718822618,
"eval_weighted_specificity": 0.9740392855593933,
"step": 643
},
{
"epoch": 5.0,
"eval_accuracy": 0.7939581719597212,
"eval_f1_macro": 0.5257108179174788,
"eval_f1_micro": 0.7939581719597211,
"eval_f1_weighted": 0.7717932414170925,
"eval_loss": 0.6710420846939087,
"eval_macro_fpr": 0.018964580711785816,
"eval_macro_sensitivity": 0.5571328425020213,
"eval_macro_specificity": 0.9845265708178329,
"eval_precision": 0.7734327517428056,
"eval_precision_macro": 0.5449998556573111,
"eval_recall": 0.7939581719597212,
"eval_recall_macro": 0.5571328425020213,
"eval_runtime": 33.235,
"eval_samples_per_second": 38.845,
"eval_steps_per_second": 4.874,
"eval_weighted_fpr": 0.018199233716475097,
"eval_weighted_sensitivity": 0.7939581719597212,
"eval_weighted_specificity": 0.9739403903077732,
"step": 803
},
{
"epoch": 6.0,
"eval_accuracy": 0.7970565453137103,
"eval_f1_macro": 0.5316254099721903,
"eval_f1_micro": 0.7970565453137104,
"eval_f1_weighted": 0.7789523196246046,
"eval_loss": 0.6454855799674988,
"eval_macro_fpr": 0.018368947118040532,
"eval_macro_sensitivity": 0.5622105847462606,
"eval_macro_specificity": 0.9848273693754934,
"eval_precision": 0.7756987894676903,
"eval_precision_macro": 0.5353415355904975,
"eval_recall": 0.7970565453137103,
"eval_recall_macro": 0.5622105847462606,
"eval_runtime": 33.0425,
"eval_samples_per_second": 39.071,
"eval_steps_per_second": 4.903,
"eval_weighted_fpr": 0.017862012544314153,
"eval_weighted_sensitivity": 0.7970565453137103,
"eval_weighted_specificity": 0.9753539953186898,
"step": 964
},
{
"epoch": 6.22,
"learning_rate": 2.916666666666667e-05,
"loss": 0.5721,
"step": 1000
},
{
"epoch": 7.0,
"eval_accuracy": 0.8001549186676995,
"eval_f1_macro": 0.5486067787470349,
"eval_f1_micro": 0.8001549186676995,
"eval_f1_weighted": 0.7845126172395842,
"eval_loss": 0.6394562721252441,
"eval_macro_fpr": 0.01807650265580631,
"eval_macro_sensitivity": 0.5784319115133939,
"eval_macro_specificity": 0.9850891561725063,
"eval_precision": 0.7801018097427485,
"eval_precision_macro": 0.5442815357986059,
"eval_recall": 0.8001549186676995,
"eval_recall_macro": 0.5784319115133939,
"eval_runtime": 32.9727,
"eval_samples_per_second": 39.154,
"eval_steps_per_second": 4.913,
"eval_weighted_fpr": 0.017527173913043478,
"eval_weighted_sensitivity": 0.8001549186676995,
"eval_weighted_specificity": 0.9761824239198935,
"step": 1125
},
{
"epoch": 8.0,
"eval_accuracy": 0.8024786986831913,
"eval_f1_macro": 0.5474570084709011,
"eval_f1_micro": 0.8024786986831914,
"eval_f1_weighted": 0.787386582262622,
"eval_loss": 0.6317066550254822,
"eval_macro_fpr": 0.017822080148589308,
"eval_macro_sensitivity": 0.5773035410379497,
"eval_macro_specificity": 0.9852623885220758,
"eval_precision": 0.783268466071204,
"eval_precision_macro": 0.5438628735250125,
"eval_recall": 0.8024786986831913,
"eval_recall_macro": 0.5773035410379497,
"eval_runtime": 33.0187,
"eval_samples_per_second": 39.099,
"eval_steps_per_second": 4.906,
"eval_weighted_fpr": 0.017277593332881633,
"eval_weighted_sensitivity": 0.8024786986831913,
"eval_weighted_specificity": 0.9764571291479465,
"step": 1286
},
{
"epoch": 9.0,
"eval_accuracy": 0.8009295120061968,
"eval_f1_macro": 0.5609368334662593,
"eval_f1_micro": 0.8009295120061968,
"eval_f1_weighted": 0.7875081013739925,
"eval_loss": 0.6136514544487,
"eval_macro_fpr": 0.017931645431496272,
"eval_macro_sensitivity": 0.5841960959288544,
"eval_macro_specificity": 0.985161694874728,
"eval_precision": 0.7827917488346946,
"eval_precision_macro": 0.5593054718395108,
"eval_recall": 0.8009295120061968,
"eval_recall_macro": 0.5841960959288544,
"eval_runtime": 33.7216,
"eval_samples_per_second": 38.284,
"eval_steps_per_second": 4.804,
"eval_weighted_fpr": 0.017443833570895267,
"eval_weighted_sensitivity": 0.8009295120061968,
"eval_weighted_specificity": 0.9764959111147221,
"step": 1446
},
{
"epoch": 9.33,
"learning_rate": 1.8750000000000002e-05,
"loss": 0.4166,
"step": 1500
},
{
"epoch": 10.0,
"eval_accuracy": 0.8156467854376452,
"eval_f1_macro": 0.6305053806449583,
"eval_f1_micro": 0.8156467854376452,
"eval_f1_weighted": 0.8066651282863864,
"eval_loss": 0.6248635649681091,
"eval_macro_fpr": 0.016463869736407642,
"eval_macro_sensitivity": 0.6430050326236179,
"eval_macro_specificity": 0.9861908495694477,
"eval_precision": 0.8054630087428596,
"eval_precision_macro": 0.639776904615918,
"eval_recall": 0.8156467854376452,
"eval_recall_macro": 0.6430050326236179,
"eval_runtime": 33.5965,
"eval_samples_per_second": 38.427,
"eval_steps_per_second": 4.822,
"eval_weighted_fpr": 0.01588785046728972,
"eval_weighted_sensitivity": 0.8156467854376452,
"eval_weighted_specificity": 0.9772159581040682,
"step": 1607
},
{
"epoch": 11.0,
"eval_accuracy": 0.8125484120836561,
"eval_f1_macro": 0.6371983241862614,
"eval_f1_micro": 0.8125484120836561,
"eval_f1_weighted": 0.8042305582147614,
"eval_loss": 0.642641544342041,
"eval_macro_fpr": 0.016876700974845713,
"eval_macro_sensitivity": 0.6520338532213917,
"eval_macro_specificity": 0.9859193883690203,
"eval_precision": 0.8013591068710365,
"eval_precision_macro": 0.6397179331634546,
"eval_recall": 0.8125484120836561,
"eval_recall_macro": 0.6520338532213917,
"eval_runtime": 33.85,
"eval_samples_per_second": 38.139,
"eval_steps_per_second": 4.786,
"eval_weighted_fpr": 0.016211146838156484,
"eval_weighted_sensitivity": 0.8125484120836561,
"eval_weighted_specificity": 0.9762424134516496,
"step": 1768
},
{
"epoch": 12.0,
"eval_accuracy": 0.8164213787761425,
"eval_f1_macro": 0.6372154277689757,
"eval_f1_micro": 0.8164213787761425,
"eval_f1_weighted": 0.8082672837501724,
"eval_loss": 0.6305465698242188,
"eval_macro_fpr": 0.016428781045237314,
"eval_macro_sensitivity": 0.6526108250586471,
"eval_macro_specificity": 0.9862261630603141,
"eval_precision": 0.8050297561179627,
"eval_precision_macro": 0.635785837139922,
"eval_recall": 0.8164213787761425,
"eval_recall_macro": 0.6526108250586471,
"eval_runtime": 33.9194,
"eval_samples_per_second": 38.061,
"eval_steps_per_second": 4.776,
"eval_weighted_fpr": 0.01580737677582872,
"eval_weighted_sensitivity": 0.8164213787761425,
"eval_weighted_specificity": 0.9769710671285662,
"step": 1929
},
{
"epoch": 12.44,
"learning_rate": 8.333333333333334e-06,
"loss": 0.3406,
"step": 2000
},
{
"epoch": 13.0,
"eval_accuracy": 0.820294345468629,
"eval_f1_macro": 0.6352955893706947,
"eval_f1_micro": 0.8202943454686291,
"eval_f1_weighted": 0.8129160642124462,
"eval_loss": 0.6275700926780701,
"eval_macro_fpr": 0.015989017879060468,
"eval_macro_sensitivity": 0.6466831772856799,
"eval_macro_specificity": 0.9865122165499488,
"eval_precision": 0.8102004267117454,
"eval_precision_macro": 0.6417861741800394,
"eval_recall": 0.820294345468629,
"eval_recall_macro": 0.6466831772856799,
"eval_runtime": 32.8101,
"eval_samples_per_second": 39.348,
"eval_steps_per_second": 4.938,
"eval_weighted_fpr": 0.015407092575375215,
"eval_weighted_sensitivity": 0.820294345468629,
"eval_weighted_specificity": 0.9773889027806014,
"step": 2089
},
{
"epoch": 14.0,
"eval_accuracy": 0.8187451587916343,
"eval_f1_macro": 0.6446278757638214,
"eval_f1_micro": 0.8187451587916342,
"eval_f1_weighted": 0.81074292931159,
"eval_loss": 0.6428066492080688,
"eval_macro_fpr": 0.016186760254085688,
"eval_macro_sensitivity": 0.6618493798882754,
"eval_macro_specificity": 0.9863911143208972,
"eval_precision": 0.8079041434352637,
"eval_precision_macro": 0.6466770185879867,
"eval_recall": 0.8187451587916343,
"eval_recall_macro": 0.6618493798882754,
"eval_runtime": 32.4757,
"eval_samples_per_second": 39.753,
"eval_steps_per_second": 4.988,
"eval_weighted_fpr": 0.015566790846194785,
"eval_weighted_sensitivity": 0.8187451587916343,
"eval_weighted_specificity": 0.9771215560218227,
"step": 2250
},
{
"epoch": 14.93,
"eval_accuracy": 0.820294345468629,
"eval_f1_macro": 0.6460817297487148,
"eval_f1_micro": 0.8202943454686291,
"eval_f1_weighted": 0.8125066936495612,
"eval_loss": 0.634365439414978,
"eval_macro_fpr": 0.016027569664931556,
"eval_macro_sensitivity": 0.6624718661648383,
"eval_macro_specificity": 0.9864925668028308,
"eval_precision": 0.8092174819516477,
"eval_precision_macro": 0.6486629857671901,
"eval_recall": 0.820294345468629,
"eval_recall_macro": 0.6624718661648383,
"eval_runtime": 32.8393,
"eval_samples_per_second": 39.313,
"eval_steps_per_second": 4.933,
"eval_weighted_fpr": 0.015407092575375215,
"eval_weighted_sensitivity": 0.820294345468629,
"eval_weighted_specificity": 0.9770941565738336,
"step": 2400
}
],
"logging_steps": 500,
"max_steps": 2400,
"num_train_epochs": 15,
"save_steps": 500,
"total_flos": 2.082121538560819e+16,
"trial_name": null,
"trial_params": null
}