|
{ |
|
"best_metric": 0.9063403443920213, |
|
"best_model_checkpoint": "./saved_models/climamba_prompt_sbdh_gpt4_v2_0/checkpoint-192", |
|
"epoch": 8.0, |
|
"eval_steps": 500, |
|
"global_step": 192, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 2.0851898193359375, |
|
"learning_rate": 0.0003, |
|
"loss": 1.4049, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_acc_macro": 0.05554596988321858, |
|
"eval_acc_micro": 0.17600550017187433, |
|
"eval_auc_macro": 0.6058912515968368, |
|
"eval_auc_micro": 0.6488212280527301, |
|
"eval_f1_at_5": 0.25079507780987353, |
|
"eval_f1_at_8": 0.24432286984749932, |
|
"eval_f1_macro": 0.09066299141125865, |
|
"eval_f1_micro": 0.2993276819643204, |
|
"eval_loss": 0.394575834274292, |
|
"eval_prec_at_5": 0.16187214611872147, |
|
"eval_prec_at_8": 0.1436929223744292, |
|
"eval_prec_macro": 0.05666691972017087, |
|
"eval_prec_micro": 0.23115124153497826, |
|
"eval_rec_at_5": 0.5565068493150684, |
|
"eval_rec_at_8": 0.8152587519025876, |
|
"eval_rec_macro": 0.22834645669278442, |
|
"eval_rec_micro": 0.4245439469319714, |
|
"eval_runtime": 6.3514, |
|
"eval_samples_per_second": 137.922, |
|
"eval_steps_per_second": 17.319, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 0.4896126985549927, |
|
"learning_rate": 0.0003, |
|
"loss": 0.3397, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_acc_macro": 0.5307003853873716, |
|
"eval_acc_micro": 0.5814606741572625, |
|
"eval_auc_macro": 0.9303990338907523, |
|
"eval_auc_micro": 0.9371828621061181, |
|
"eval_f1_at_5": 0.4088221844905389, |
|
"eval_f1_at_8": 0.28901449364842885, |
|
"eval_f1_macro": 0.6465579930529745, |
|
"eval_f1_micro": 0.7353463587921194, |
|
"eval_loss": 0.18900679051876068, |
|
"eval_prec_at_5": 0.2614155251141553, |
|
"eval_prec_at_8": 0.16980593607305935, |
|
"eval_prec_macro": 0.7313857838097021, |
|
"eval_prec_micro": 0.7915869980878784, |
|
"eval_rec_at_5": 0.9374048706240486, |
|
"eval_rec_at_8": 0.9699391171993911, |
|
"eval_rec_macro": 0.6410238611610916, |
|
"eval_rec_micro": 0.6865671641790475, |
|
"eval_runtime": 6.4111, |
|
"eval_samples_per_second": 136.637, |
|
"eval_steps_per_second": 17.158, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 0.1705099642276764, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0916, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_acc_macro": 0.8244239681810236, |
|
"eval_acc_micro": 0.8311011904761286, |
|
"eval_auc_macro": 0.9919756925761466, |
|
"eval_auc_micro": 0.9920428839397825, |
|
"eval_f1_at_5": 0.42784762619628447, |
|
"eval_f1_at_8": 0.29274329072668936, |
|
"eval_f1_macro": 0.9019972941167671, |
|
"eval_f1_micro": 0.907761072734587, |
|
"eval_loss": 0.0666864886879921, |
|
"eval_prec_at_5": 0.273972602739726, |
|
"eval_prec_at_8": 0.1720890410958904, |
|
"eval_prec_macro": 0.8888004919536745, |
|
"eval_prec_micro": 0.8900398406373793, |
|
"eval_rec_at_5": 0.976027397260274, |
|
"eval_rec_at_8": 0.9794520547945206, |
|
"eval_rec_macro": 0.9176060797993615, |
|
"eval_rec_micro": 0.9262023217246329, |
|
"eval_runtime": 6.4724, |
|
"eval_samples_per_second": 135.345, |
|
"eval_steps_per_second": 16.995, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 0.16448086500167847, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0471, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_acc_macro": 0.8271437680276396, |
|
"eval_acc_micro": 0.8323529411764093, |
|
"eval_auc_macro": 0.993671108576282, |
|
"eval_auc_micro": 0.9937186337101654, |
|
"eval_f1_at_5": 0.4285323653750887, |
|
"eval_f1_at_8": 0.29274329072668936, |
|
"eval_f1_macro": 0.9038769548624298, |
|
"eval_f1_micro": 0.9085072231138916, |
|
"eval_loss": 0.06305181980133057, |
|
"eval_prec_at_5": 0.27442922374429224, |
|
"eval_prec_at_8": 0.1720890410958904, |
|
"eval_prec_macro": 0.8786407478949387, |
|
"eval_prec_micro": 0.8802488335924665, |
|
"eval_rec_at_5": 0.977359208523592, |
|
"eval_rec_at_8": 0.9794520547945206, |
|
"eval_rec_macro": 0.9344636739690416, |
|
"eval_rec_micro": 0.9386401326699055, |
|
"eval_runtime": 6.3196, |
|
"eval_samples_per_second": 138.617, |
|
"eval_steps_per_second": 17.406, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 0.22940804064273834, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0292, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_acc_macro": 0.8308612963912455, |
|
"eval_acc_micro": 0.8424710424709774, |
|
"eval_auc_macro": 0.9930217118288992, |
|
"eval_auc_micro": 0.9944139892271574, |
|
"eval_f1_at_5": 0.4295136788854873, |
|
"eval_f1_at_8": 0.29274329072668936, |
|
"eval_f1_macro": 0.90558341223627, |
|
"eval_f1_micro": 0.9145012573343744, |
|
"eval_loss": 0.06955315172672272, |
|
"eval_prec_at_5": 0.2751141552511416, |
|
"eval_prec_at_8": 0.1720890410958904, |
|
"eval_prec_macro": 0.9134147654048902, |
|
"eval_prec_micro": 0.9245762711863623, |
|
"eval_rec_at_5": 0.9788812785388128, |
|
"eval_rec_at_8": 0.9794520547945206, |
|
"eval_rec_macro": 0.9000407679288313, |
|
"eval_rec_micro": 0.9046434494194938, |
|
"eval_runtime": 6.3259, |
|
"eval_samples_per_second": 138.479, |
|
"eval_steps_per_second": 17.389, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 0.14079643785953522, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0169, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_acc_macro": 0.8220596818065521, |
|
"eval_acc_micro": 0.8319327731091801, |
|
"eval_auc_macro": 0.9927035556143388, |
|
"eval_auc_micro": 0.9939625962172801, |
|
"eval_f1_at_5": 0.4277378477874334, |
|
"eval_f1_at_8": 0.29274329072668936, |
|
"eval_f1_macro": 0.8993295914850711, |
|
"eval_f1_micro": 0.9082568807338691, |
|
"eval_loss": 0.07188171148300171, |
|
"eval_prec_at_5": 0.27397260273972607, |
|
"eval_prec_at_8": 0.1720890410958904, |
|
"eval_prec_macro": 0.9063614647378323, |
|
"eval_prec_micro": 0.913590604026769, |
|
"eval_rec_at_5": 0.9748858447488584, |
|
"eval_rec_at_8": 0.9794520547945206, |
|
"eval_rec_macro": 0.8937033781116202, |
|
"eval_rec_micro": 0.9029850746267908, |
|
"eval_runtime": 6.3449, |
|
"eval_samples_per_second": 138.064, |
|
"eval_steps_per_second": 17.337, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 0.12200725823640823, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0095, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_acc_macro": 0.8261283592776246, |
|
"eval_acc_micro": 0.8320433436531863, |
|
"eval_auc_macro": 0.9914073448442141, |
|
"eval_auc_micro": 0.9922562843066707, |
|
"eval_f1_at_5": 0.42747783226694747, |
|
"eval_f1_at_8": 0.2925113305987028, |
|
"eval_f1_macro": 0.9026710595366999, |
|
"eval_f1_micro": 0.9083227714405654, |
|
"eval_loss": 0.09724259376525879, |
|
"eval_prec_at_5": 0.27374429223744295, |
|
"eval_prec_at_8": 0.17194634703196346, |
|
"eval_prec_macro": 0.9186608707729786, |
|
"eval_prec_micro": 0.9259259259258461, |
|
"eval_rec_at_5": 0.975076103500761, |
|
"eval_rec_at_8": 0.9788812785388128, |
|
"eval_rec_macro": 0.8890001231603133, |
|
"eval_rec_micro": 0.8913764510778697, |
|
"eval_runtime": 6.3561, |
|
"eval_samples_per_second": 137.82, |
|
"eval_steps_per_second": 17.306, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 0.1273776739835739, |
|
"learning_rate": 0.0003, |
|
"loss": 0.0061, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_acc_macro": 0.8331638553801589, |
|
"eval_acc_micro": 0.8417047184169831, |
|
"eval_auc_macro": 0.9887523718801591, |
|
"eval_auc_micro": 0.9910290762677764, |
|
"eval_f1_at_5": 0.42681135828205624, |
|
"eval_f1_at_8": 0.29225388037164507, |
|
"eval_f1_macro": 0.9063403443920213, |
|
"eval_f1_micro": 0.9140495867767839, |
|
"eval_loss": 0.09798464179039001, |
|
"eval_prec_at_5": 0.2732876712328767, |
|
"eval_prec_at_8": 0.17180365296803654, |
|
"eval_prec_macro": 0.9010794509609382, |
|
"eval_prec_micro": 0.9110378912684587, |
|
"eval_rec_at_5": 0.9739345509893454, |
|
"eval_rec_at_8": 0.9777397260273972, |
|
"eval_rec_macro": 0.9130526960570995, |
|
"eval_rec_micro": 0.9170812603647663, |
|
"eval_runtime": 6.4145, |
|
"eval_samples_per_second": 136.565, |
|
"eval_steps_per_second": 17.149, |
|
"step": 192 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 960, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 40, |
|
"save_steps": 500, |
|
"total_flos": 0.0, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|