| { | |
| "best_metric": 0.6528931773500395, | |
| "best_model_checkpoint": "case-analysis-bert-base-uncased/checkpoint-2912", | |
| "epoch": 22.0, | |
| "eval_steps": 500, | |
| "global_step": 4928, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "eval_accuracy": 0.7861915367483296, | |
| "eval_f1_macro": 0.5606209513919795, | |
| "eval_f1_micro": 0.7861915367483298, | |
| "eval_f1_weighted": 0.7596863457967054, | |
| "eval_loss": 0.7283128499984741, | |
| "eval_macro_fpr": 0.1142150114777894, | |
| "eval_macro_sensitivity": 0.5571958513134984, | |
| "eval_macro_specificity": 0.8974437739369907, | |
| "eval_precision": 0.7487100743874461, | |
| "eval_precision_macro": 0.584767668299669, | |
| "eval_recall": 0.7861915367483296, | |
| "eval_recall_macro": 0.5571958513134984, | |
| "eval_runtime": 9.7006, | |
| "eval_samples_per_second": 46.286, | |
| "eval_steps_per_second": 5.876, | |
| "eval_weighted_fpr": 0.08311688311688312, | |
| "eval_weighted_sensitivity": 0.7861915367483296, | |
| "eval_weighted_specificity": 0.8035835589996332, | |
| "step": 224 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_accuracy": 0.799554565701559, | |
| "eval_f1_macro": 0.5913567856292314, | |
| "eval_f1_micro": 0.799554565701559, | |
| "eval_f1_weighted": 0.7794312570974847, | |
| "eval_loss": 0.816001296043396, | |
| "eval_macro_fpr": 0.09972743460349152, | |
| "eval_macro_sensitivity": 0.6065148418089594, | |
| "eval_macro_specificity": 0.910318444398066, | |
| "eval_precision": 0.7603126937076594, | |
| "eval_precision_macro": 0.5769576335614072, | |
| "eval_recall": 0.799554565701559, | |
| "eval_recall_macro": 0.6065148418089594, | |
| "eval_runtime": 39.2963, | |
| "eval_samples_per_second": 11.426, | |
| "eval_steps_per_second": 1.451, | |
| "eval_weighted_fpr": 0.07712082262210797, | |
| "eval_weighted_sensitivity": 0.799554565701559, | |
| "eval_weighted_specificity": 0.8417192118907049, | |
| "step": 448 | |
| }, | |
| { | |
| "epoch": 2.232142857142857, | |
| "grad_norm": 10.089143753051758, | |
| "learning_rate": 4.6302083333333335e-05, | |
| "loss": 0.6512, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_accuracy": 0.7906458797327395, | |
| "eval_f1_macro": 0.5840451851613266, | |
| "eval_f1_micro": 0.7906458797327395, | |
| "eval_f1_weighted": 0.771952482046502, | |
| "eval_loss": 0.8587548136711121, | |
| "eval_macro_fpr": 0.10045553338392213, | |
| "eval_macro_sensitivity": 0.5989408048231577, | |
| "eval_macro_specificity": 0.9104668136432382, | |
| "eval_precision": 0.7597703984690992, | |
| "eval_precision_macro": 0.5770004879708264, | |
| "eval_recall": 0.7906458797327395, | |
| "eval_recall_macro": 0.5989408048231577, | |
| "eval_runtime": 36.0068, | |
| "eval_samples_per_second": 12.47, | |
| "eval_steps_per_second": 1.583, | |
| "eval_weighted_fpr": 0.0811044003451251, | |
| "eval_weighted_sensitivity": 0.7906458797327395, | |
| "eval_weighted_specificity": 0.8512213748402133, | |
| "step": 672 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_accuracy": 0.7817371937639198, | |
| "eval_f1_macro": 0.6299493260025852, | |
| "eval_f1_micro": 0.7817371937639198, | |
| "eval_f1_weighted": 0.7804892003577936, | |
| "eval_loss": 1.0820659399032593, | |
| "eval_macro_fpr": 0.09955325556886446, | |
| "eval_macro_sensitivity": 0.6429130620307091, | |
| "eval_macro_specificity": 0.9124114631310538, | |
| "eval_precision": 0.7819490155060428, | |
| "eval_precision_macro": 0.6213857962213225, | |
| "eval_recall": 0.7817371937639198, | |
| "eval_recall_macro": 0.6429130620307091, | |
| "eval_runtime": 32.7545, | |
| "eval_samples_per_second": 13.708, | |
| "eval_steps_per_second": 1.74, | |
| "eval_weighted_fpr": 0.08514335360556038, | |
| "eval_weighted_sensitivity": 0.7817371937639198, | |
| "eval_weighted_specificity": 0.8679086587602954, | |
| "step": 896 | |
| }, | |
| { | |
| "epoch": 4.464285714285714, | |
| "grad_norm": 0.3640059232711792, | |
| "learning_rate": 4.258184523809524e-05, | |
| "loss": 0.3466, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_accuracy": 0.8084632516703786, | |
| "eval_f1_macro": 0.619470115868435, | |
| "eval_f1_micro": 0.8084632516703786, | |
| "eval_f1_weighted": 0.7927603955642376, | |
| "eval_loss": 1.0612273216247559, | |
| "eval_macro_fpr": 0.09480480467421379, | |
| "eval_macro_sensitivity": 0.6262706556824204, | |
| "eval_macro_specificity": 0.9138770264258179, | |
| "eval_precision": 0.7999415514782998, | |
| "eval_precision_macro": 0.7128659611992946, | |
| "eval_recall": 0.8084632516703786, | |
| "eval_recall_macro": 0.6262706556824204, | |
| "eval_runtime": 34.7281, | |
| "eval_samples_per_second": 12.929, | |
| "eval_steps_per_second": 1.641, | |
| "eval_weighted_fpr": 0.07319148936170213, | |
| "eval_weighted_sensitivity": 0.8084632516703786, | |
| "eval_weighted_specificity": 0.847044854032893, | |
| "step": 1120 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_accuracy": 0.7928730512249443, | |
| "eval_f1_macro": 0.6273476992208005, | |
| "eval_f1_micro": 0.7928730512249443, | |
| "eval_f1_weighted": 0.7896519709076985, | |
| "eval_loss": 1.2559400796890259, | |
| "eval_macro_fpr": 0.09508832825281638, | |
| "eval_macro_sensitivity": 0.6361528640940406, | |
| "eval_macro_specificity": 0.9161350599199577, | |
| "eval_precision": 0.7876580739535682, | |
| "eval_precision_macro": 0.6205792331164909, | |
| "eval_recall": 0.7928730512249443, | |
| "eval_recall_macro": 0.6361528640940406, | |
| "eval_runtime": 38.0322, | |
| "eval_samples_per_second": 11.806, | |
| "eval_steps_per_second": 1.499, | |
| "eval_weighted_fpr": 0.08010335917312661, | |
| "eval_weighted_sensitivity": 0.7928730512249443, | |
| "eval_weighted_specificity": 0.8716671884548861, | |
| "step": 1344 | |
| }, | |
| { | |
| "epoch": 6.696428571428571, | |
| "grad_norm": 0.05509716644883156, | |
| "learning_rate": 3.8869047619047625e-05, | |
| "loss": 0.1715, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_accuracy": 0.7928730512249443, | |
| "eval_f1_macro": 0.623650691198171, | |
| "eval_f1_micro": 0.7928730512249443, | |
| "eval_f1_weighted": 0.7892792124992886, | |
| "eval_loss": 1.3700848817825317, | |
| "eval_macro_fpr": 0.09905686727492574, | |
| "eval_macro_sensitivity": 0.6178801987625516, | |
| "eval_macro_specificity": 0.9121558558439, | |
| "eval_precision": 0.7889374292245007, | |
| "eval_precision_macro": 0.6344745555953697, | |
| "eval_recall": 0.7928730512249443, | |
| "eval_recall_macro": 0.6178801987625516, | |
| "eval_runtime": 38.6276, | |
| "eval_samples_per_second": 11.624, | |
| "eval_steps_per_second": 1.476, | |
| "eval_weighted_fpr": 0.08010335917312661, | |
| "eval_weighted_sensitivity": 0.7928730512249443, | |
| "eval_weighted_specificity": 0.8557503721506562, | |
| "step": 1568 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_accuracy": 0.8106904231625836, | |
| "eval_f1_macro": 0.6464437798898967, | |
| "eval_f1_micro": 0.8106904231625834, | |
| "eval_f1_weighted": 0.8064189899649085, | |
| "eval_loss": 1.4005118608474731, | |
| "eval_macro_fpr": 0.0921754708102674, | |
| "eval_macro_sensitivity": 0.6370398282162988, | |
| "eval_macro_specificity": 0.9178527413440807, | |
| "eval_precision": 0.8034816923327339, | |
| "eval_precision_macro": 0.6578060011883542, | |
| "eval_recall": 0.8106904231625836, | |
| "eval_recall_macro": 0.6370398282162988, | |
| "eval_runtime": 35.6698, | |
| "eval_samples_per_second": 12.588, | |
| "eval_steps_per_second": 1.598, | |
| "eval_weighted_fpr": 0.07221750212404418, | |
| "eval_weighted_sensitivity": 0.8106904231625836, | |
| "eval_weighted_specificity": 0.860720542213739, | |
| "step": 1792 | |
| }, | |
| { | |
| "epoch": 8.928571428571429, | |
| "grad_norm": 0.005432427860796452, | |
| "learning_rate": 3.514880952380952e-05, | |
| "loss": 0.0636, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_accuracy": 0.8017817371937639, | |
| "eval_f1_macro": 0.6263115408785538, | |
| "eval_f1_micro": 0.8017817371937639, | |
| "eval_f1_weighted": 0.7896240754364972, | |
| "eval_loss": 1.473650336265564, | |
| "eval_macro_fpr": 0.10259295399855256, | |
| "eval_macro_sensitivity": 0.6149052987288282, | |
| "eval_macro_specificity": 0.9072211454744684, | |
| "eval_precision": 0.788055851480147, | |
| "eval_precision_macro": 0.6582800876341822, | |
| "eval_recall": 0.8017817371937639, | |
| "eval_recall_macro": 0.6149052987288282, | |
| "eval_runtime": 34.11, | |
| "eval_samples_per_second": 13.163, | |
| "eval_steps_per_second": 1.671, | |
| "eval_weighted_fpr": 0.07613344739093242, | |
| "eval_weighted_sensitivity": 0.8017817371937639, | |
| "eval_weighted_specificity": 0.8271028447041098, | |
| "step": 2016 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "eval_accuracy": 0.7884187082405345, | |
| "eval_f1_macro": 0.6331690370327951, | |
| "eval_f1_micro": 0.7884187082405345, | |
| "eval_f1_weighted": 0.7909426185077314, | |
| "eval_loss": 1.7568920850753784, | |
| "eval_macro_fpr": 0.09595908153187079, | |
| "eval_macro_sensitivity": 0.6428373560726501, | |
| "eval_macro_specificity": 0.91584307980206, | |
| "eval_precision": 0.7961677526311304, | |
| "eval_precision_macro": 0.6275270485563467, | |
| "eval_recall": 0.7884187082405345, | |
| "eval_recall_macro": 0.6428373560726501, | |
| "eval_runtime": 42.7436, | |
| "eval_samples_per_second": 10.504, | |
| "eval_steps_per_second": 1.334, | |
| "eval_weighted_fpr": 0.08210890233362143, | |
| "eval_weighted_sensitivity": 0.7884187082405345, | |
| "eval_weighted_specificity": 0.8749536109677053, | |
| "step": 2240 | |
| }, | |
| { | |
| "epoch": 11.0, | |
| "eval_accuracy": 0.7906458797327395, | |
| "eval_f1_macro": 0.6101321036639349, | |
| "eval_f1_micro": 0.7906458797327395, | |
| "eval_f1_weighted": 0.7845175231806186, | |
| "eval_loss": 1.7140623331069946, | |
| "eval_macro_fpr": 0.1035198920558284, | |
| "eval_macro_sensitivity": 0.6082973730032554, | |
| "eval_macro_specificity": 0.9082706582818566, | |
| "eval_precision": 0.7824040660397941, | |
| "eval_precision_macro": 0.6165716760629552, | |
| "eval_recall": 0.7906458797327395, | |
| "eval_recall_macro": 0.6082973730032554, | |
| "eval_runtime": 37.438, | |
| "eval_samples_per_second": 11.993, | |
| "eval_steps_per_second": 1.523, | |
| "eval_weighted_fpr": 0.0811044003451251, | |
| "eval_weighted_sensitivity": 0.7906458797327395, | |
| "eval_weighted_specificity": 0.842436753394687, | |
| "step": 2464 | |
| }, | |
| { | |
| "epoch": 11.160714285714286, | |
| "grad_norm": 0.0017704592319205403, | |
| "learning_rate": 3.142857142857143e-05, | |
| "loss": 0.0159, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 12.0, | |
| "eval_accuracy": 0.7951002227171492, | |
| "eval_f1_macro": 0.6372747490500124, | |
| "eval_f1_micro": 0.7951002227171492, | |
| "eval_f1_weighted": 0.7916670590899947, | |
| "eval_loss": 1.714410662651062, | |
| "eval_macro_fpr": 0.09685632952239012, | |
| "eval_macro_sensitivity": 0.6412759206876854, | |
| "eval_macro_specificity": 0.9140152346037369, | |
| "eval_precision": 0.7913770752065027, | |
| "eval_precision_macro": 0.6393393002684569, | |
| "eval_recall": 0.7951002227171492, | |
| "eval_recall_macro": 0.6412759206876854, | |
| "eval_runtime": 34.7517, | |
| "eval_samples_per_second": 12.92, | |
| "eval_steps_per_second": 1.64, | |
| "eval_weighted_fpr": 0.07910576096302666, | |
| "eval_weighted_sensitivity": 0.7951002227171492, | |
| "eval_weighted_specificity": 0.8609607156977986, | |
| "step": 2688 | |
| }, | |
| { | |
| "epoch": 13.0, | |
| "eval_accuracy": 0.799554565701559, | |
| "eval_f1_macro": 0.6528931773500395, | |
| "eval_f1_micro": 0.799554565701559, | |
| "eval_f1_weighted": 0.798188843376642, | |
| "eval_loss": 1.7243342399597168, | |
| "eval_macro_fpr": 0.09420589017594908, | |
| "eval_macro_sensitivity": 0.6525655716832187, | |
| "eval_macro_specificity": 0.9158469519501292, | |
| "eval_precision": 0.7968817042081011, | |
| "eval_precision_macro": 0.6534600751896625, | |
| "eval_recall": 0.799554565701559, | |
| "eval_recall_macro": 0.6525655716832187, | |
| "eval_runtime": 35.7184, | |
| "eval_samples_per_second": 12.571, | |
| "eval_steps_per_second": 1.596, | |
| "eval_weighted_fpr": 0.07712082262210797, | |
| "eval_weighted_sensitivity": 0.799554565701559, | |
| "eval_weighted_specificity": 0.8638332420989578, | |
| "step": 2912 | |
| }, | |
| { | |
| "epoch": 13.392857142857142, | |
| "grad_norm": 0.0014869036385789514, | |
| "learning_rate": 2.7708333333333337e-05, | |
| "loss": 0.0043, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 14.0, | |
| "eval_accuracy": 0.7973273942093542, | |
| "eval_f1_macro": 0.6334742709127367, | |
| "eval_f1_micro": 0.7973273942093542, | |
| "eval_f1_weighted": 0.7911632678226206, | |
| "eval_loss": 1.8550578355789185, | |
| "eval_macro_fpr": 0.10413380473626513, | |
| "eval_macro_sensitivity": 0.6189159939159938, | |
| "eval_macro_specificity": 0.9071845213512801, | |
| "eval_precision": 0.7948329741898784, | |
| "eval_precision_macro": 0.6575689935064936, | |
| "eval_recall": 0.7973273942093542, | |
| "eval_recall_macro": 0.6189159939159938, | |
| "eval_runtime": 37.3063, | |
| "eval_samples_per_second": 12.035, | |
| "eval_steps_per_second": 1.528, | |
| "eval_weighted_fpr": 0.07811158798283262, | |
| "eval_weighted_sensitivity": 0.7973273942093542, | |
| "eval_weighted_specificity": 0.8314106911957669, | |
| "step": 3136 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "eval_accuracy": 0.7928730512249443, | |
| "eval_f1_macro": 0.6104462132353847, | |
| "eval_f1_micro": 0.7928730512249443, | |
| "eval_f1_weighted": 0.7860581271310794, | |
| "eval_loss": 1.8840636014938354, | |
| "eval_macro_fpr": 0.10077968846838097, | |
| "eval_macro_sensitivity": 0.616244778009484, | |
| "eval_macro_specificity": 0.9109811795750432, | |
| "eval_precision": 0.7868702804113628, | |
| "eval_precision_macro": 0.6153843681293956, | |
| "eval_recall": 0.7928730512249443, | |
| "eval_recall_macro": 0.616244778009484, | |
| "eval_runtime": 37.5124, | |
| "eval_samples_per_second": 11.969, | |
| "eval_steps_per_second": 1.519, | |
| "eval_weighted_fpr": 0.08010335917312661, | |
| "eval_weighted_sensitivity": 0.7928730512249443, | |
| "eval_weighted_specificity": 0.8510516670752286, | |
| "step": 3360 | |
| }, | |
| { | |
| "epoch": 15.625, | |
| "grad_norm": 0.0012946381466463208, | |
| "learning_rate": 2.3995535714285717e-05, | |
| "loss": 0.0029, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 16.0, | |
| "eval_accuracy": 0.755011135857461, | |
| "eval_f1_macro": 0.6015295009953532, | |
| "eval_f1_micro": 0.755011135857461, | |
| "eval_f1_weighted": 0.7660603471590911, | |
| "eval_loss": 2.0852534770965576, | |
| "eval_macro_fpr": 0.1100287944234454, | |
| "eval_macro_sensitivity": 0.6118684574566927, | |
| "eval_macro_specificity": 0.9061965043355904, | |
| "eval_precision": 0.7837194577525304, | |
| "eval_precision_macro": 0.6010349959287868, | |
| "eval_recall": 0.755011135857461, | |
| "eval_recall_macro": 0.6118684574566927, | |
| "eval_runtime": 40.7827, | |
| "eval_samples_per_second": 11.01, | |
| "eval_steps_per_second": 1.398, | |
| "eval_weighted_fpr": 0.09760425909494233, | |
| "eval_weighted_sensitivity": 0.755011135857461, | |
| "eval_weighted_specificity": 0.8697748814849007, | |
| "step": 3584 | |
| }, | |
| { | |
| "epoch": 17.0, | |
| "eval_accuracy": 0.7839643652561247, | |
| "eval_f1_macro": 0.5916565481092323, | |
| "eval_f1_micro": 0.7839643652561247, | |
| "eval_f1_weighted": 0.7797414440266076, | |
| "eval_loss": 1.9721872806549072, | |
| "eval_macro_fpr": 0.10755611089319247, | |
| "eval_macro_sensitivity": 0.5838615544497898, | |
| "eval_macro_specificity": 0.9058507118814452, | |
| "eval_precision": 0.7783473447757774, | |
| "eval_precision_macro": 0.6018491347401939, | |
| "eval_recall": 0.7839643652561247, | |
| "eval_recall_macro": 0.5838615544497898, | |
| "eval_runtime": 39.509, | |
| "eval_samples_per_second": 11.365, | |
| "eval_steps_per_second": 1.443, | |
| "eval_weighted_fpr": 0.08412836079791847, | |
| "eval_weighted_sensitivity": 0.7839643652561247, | |
| "eval_weighted_specificity": 0.839438482269656, | |
| "step": 3808 | |
| }, | |
| { | |
| "epoch": 17.857142857142858, | |
| "grad_norm": 0.0011545266024768353, | |
| "learning_rate": 2.027529761904762e-05, | |
| "loss": 0.0071, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 18.0, | |
| "eval_accuracy": 0.799554565701559, | |
| "eval_f1_macro": 0.5960313624746896, | |
| "eval_f1_micro": 0.799554565701559, | |
| "eval_f1_weighted": 0.7840137565459063, | |
| "eval_loss": 1.873466968536377, | |
| "eval_macro_fpr": 0.10533282331246058, | |
| "eval_macro_sensitivity": 0.5916575475399004, | |
| "eval_macro_specificity": 0.9047142410835605, | |
| "eval_precision": 0.7783001729348953, | |
| "eval_precision_macro": 0.6085738092705436, | |
| "eval_recall": 0.799554565701559, | |
| "eval_recall_macro": 0.5916575475399004, | |
| "eval_runtime": 42.6376, | |
| "eval_samples_per_second": 10.531, | |
| "eval_steps_per_second": 1.337, | |
| "eval_weighted_fpr": 0.07712082262210797, | |
| "eval_weighted_sensitivity": 0.799554565701559, | |
| "eval_weighted_specificity": 0.819302398632683, | |
| "step": 4032 | |
| }, | |
| { | |
| "epoch": 19.0, | |
| "eval_accuracy": 0.8017817371937639, | |
| "eval_f1_macro": 0.6000566425748908, | |
| "eval_f1_micro": 0.8017817371937639, | |
| "eval_f1_weighted": 0.7894612476993438, | |
| "eval_loss": 1.8293864727020264, | |
| "eval_macro_fpr": 0.10248664637782996, | |
| "eval_macro_sensitivity": 0.5942573589632414, | |
| "eval_macro_specificity": 0.9081532391165263, | |
| "eval_precision": 0.783975414299672, | |
| "eval_precision_macro": 0.6113679316195262, | |
| "eval_recall": 0.8017817371937639, | |
| "eval_recall_macro": 0.5942573589632414, | |
| "eval_runtime": 39.1005, | |
| "eval_samples_per_second": 11.483, | |
| "eval_steps_per_second": 1.458, | |
| "eval_weighted_fpr": 0.07613344739093242, | |
| "eval_weighted_sensitivity": 0.8017817371937639, | |
| "eval_weighted_specificity": 0.8308312192723414, | |
| "step": 4256 | |
| }, | |
| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.7973273942093542, | |
| "eval_f1_macro": 0.6285046967011023, | |
| "eval_f1_micro": 0.7973273942093542, | |
| "eval_f1_weighted": 0.7941797156806406, | |
| "eval_loss": 1.8577601909637451, | |
| "eval_macro_fpr": 0.09902815238438424, | |
| "eval_macro_sensitivity": 0.6232260717554835, | |
| "eval_macro_specificity": 0.9117572211656928, | |
| "eval_precision": 0.7938657405716162, | |
| "eval_precision_macro": 0.636714448785387, | |
| "eval_recall": 0.7973273942093542, | |
| "eval_recall_macro": 0.6232260717554835, | |
| "eval_runtime": 44.7659, | |
| "eval_samples_per_second": 10.03, | |
| "eval_steps_per_second": 1.273, | |
| "eval_weighted_fpr": 0.07811158798283262, | |
| "eval_weighted_sensitivity": 0.7973273942093542, | |
| "eval_weighted_specificity": 0.8497014904534173, | |
| "step": 4480 | |
| }, | |
| { | |
| "epoch": 20.089285714285715, | |
| "grad_norm": 0.0009593501454219222, | |
| "learning_rate": 1.6555059523809523e-05, | |
| "loss": 0.0049, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 21.0, | |
| "eval_accuracy": 0.7973273942093542, | |
| "eval_f1_macro": 0.6285046967011023, | |
| "eval_f1_micro": 0.7973273942093542, | |
| "eval_f1_weighted": 0.7941797156806406, | |
| "eval_loss": 1.8769508600234985, | |
| "eval_macro_fpr": 0.09902815238438424, | |
| "eval_macro_sensitivity": 0.6232260717554835, | |
| "eval_macro_specificity": 0.9117572211656928, | |
| "eval_precision": 0.7938657405716162, | |
| "eval_precision_macro": 0.636714448785387, | |
| "eval_recall": 0.7973273942093542, | |
| "eval_recall_macro": 0.6232260717554835, | |
| "eval_runtime": 38.5375, | |
| "eval_samples_per_second": 11.651, | |
| "eval_steps_per_second": 1.479, | |
| "eval_weighted_fpr": 0.07811158798283262, | |
| "eval_weighted_sensitivity": 0.7973273942093542, | |
| "eval_weighted_specificity": 0.8497014904534173, | |
| "step": 4704 | |
| }, | |
| { | |
| "epoch": 22.0, | |
| "eval_accuracy": 0.7951002227171492, | |
| "eval_f1_macro": 0.615484044892805, | |
| "eval_f1_micro": 0.7951002227171492, | |
| "eval_f1_weighted": 0.7900289393227489, | |
| "eval_loss": 1.8931797742843628, | |
| "eval_macro_fpr": 0.10072490056374342, | |
| "eval_macro_sensitivity": 0.6118624353918471, | |
| "eval_macro_specificity": 0.9103064506905846, | |
| "eval_precision": 0.7876199411756162, | |
| "eval_precision_macro": 0.6219132429554252, | |
| "eval_recall": 0.7951002227171492, | |
| "eval_recall_macro": 0.6118624353918471, | |
| "eval_runtime": 42.2273, | |
| "eval_samples_per_second": 10.633, | |
| "eval_steps_per_second": 1.35, | |
| "eval_weighted_fpr": 0.07910576096302666, | |
| "eval_weighted_sensitivity": 0.7951002227171492, | |
| "eval_weighted_specificity": 0.8461255800451891, | |
| "step": 4928 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 6720, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 30, | |
| "save_steps": 500, | |
| "total_flos": 1.0373076514504704e+16, | |
| "train_batch_size": 8, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |