nickthegroot's picture
End of training
37cea4d unverified
{
"best_metric": 0.5854,
"best_model_checkpoint": "/home/azureuser/cloudfiles/code/Users/nick.degroot/page-segmentation/runs/20250307-table-transformer-is-floorplan/checkpoint-14237",
"epoch": 23.0,
"eval_steps": 500,
"global_step": 14237,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 12.473027229309082,
"learning_rate": 4.9e-05,
"loss": 0.9573,
"step": 619
},
{
"epoch": 1.0,
"eval_loss": 1.048191785812378,
"eval_map": 0.4914,
"eval_map_50": 0.7176,
"eval_map_75": 0.5594,
"eval_map_large": 0.4916,
"eval_map_layer_floorplan": 0.4995,
"eval_map_layer_non_floorplan": 0.4832,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.4913,
"eval_mar_10": 0.7178,
"eval_mar_100": 0.7221,
"eval_mar_100_layer_floorplan": 0.7331,
"eval_mar_100_layer_non_floorplan": 0.7112,
"eval_mar_large": 0.7225,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 96.7259,
"eval_samples_per_second": 22.734,
"eval_steps_per_second": 1.427,
"step": 619
},
{
"epoch": 2.0,
"grad_norm": 10.47475528717041,
"learning_rate": 4.8e-05,
"loss": 0.9177,
"step": 1238
},
{
"epoch": 2.0,
"eval_loss": 1.0183632373809814,
"eval_map": 0.5167,
"eval_map_50": 0.7402,
"eval_map_75": 0.5901,
"eval_map_large": 0.517,
"eval_map_layer_floorplan": 0.524,
"eval_map_layer_non_floorplan": 0.5093,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.5002,
"eval_mar_10": 0.7294,
"eval_mar_100": 0.7339,
"eval_mar_100_layer_floorplan": 0.74,
"eval_mar_100_layer_non_floorplan": 0.7278,
"eval_mar_large": 0.7343,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 98.7563,
"eval_samples_per_second": 22.267,
"eval_steps_per_second": 1.397,
"step": 1238
},
{
"epoch": 3.0,
"grad_norm": 20.04204750061035,
"learning_rate": 4.7e-05,
"loss": 0.8733,
"step": 1857
},
{
"epoch": 3.0,
"eval_loss": 1.004949927330017,
"eval_map": 0.513,
"eval_map_50": 0.7336,
"eval_map_75": 0.592,
"eval_map_large": 0.5133,
"eval_map_layer_floorplan": 0.5146,
"eval_map_layer_non_floorplan": 0.5115,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5033,
"eval_mar_10": 0.7314,
"eval_mar_100": 0.7355,
"eval_mar_100_layer_floorplan": 0.7343,
"eval_mar_100_layer_non_floorplan": 0.7367,
"eval_mar_large": 0.7359,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 99.4564,
"eval_samples_per_second": 22.11,
"eval_steps_per_second": 1.388,
"step": 1857
},
{
"epoch": 4.0,
"grad_norm": 13.674722671508789,
"learning_rate": 4.600000000000001e-05,
"loss": 0.8412,
"step": 2476
},
{
"epoch": 4.0,
"eval_loss": 0.9946977496147156,
"eval_map": 0.5209,
"eval_map_50": 0.7417,
"eval_map_75": 0.6007,
"eval_map_large": 0.5212,
"eval_map_layer_floorplan": 0.5212,
"eval_map_layer_non_floorplan": 0.5207,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.5025,
"eval_mar_10": 0.7295,
"eval_mar_100": 0.7341,
"eval_mar_100_layer_floorplan": 0.7329,
"eval_mar_100_layer_non_floorplan": 0.7352,
"eval_mar_large": 0.7345,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 99.2293,
"eval_samples_per_second": 22.161,
"eval_steps_per_second": 1.391,
"step": 2476
},
{
"epoch": 5.0,
"grad_norm": 16.09870719909668,
"learning_rate": 4.5e-05,
"loss": 0.8108,
"step": 3095
},
{
"epoch": 5.0,
"eval_loss": 1.0007381439208984,
"eval_map": 0.5323,
"eval_map_50": 0.76,
"eval_map_75": 0.6165,
"eval_map_large": 0.5326,
"eval_map_layer_floorplan": 0.5335,
"eval_map_layer_non_floorplan": 0.5311,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.4993,
"eval_mar_10": 0.7173,
"eval_mar_100": 0.7217,
"eval_mar_100_layer_floorplan": 0.7096,
"eval_mar_100_layer_non_floorplan": 0.7339,
"eval_mar_large": 0.7221,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 102.6206,
"eval_samples_per_second": 21.428,
"eval_steps_per_second": 1.345,
"step": 3095
},
{
"epoch": 6.0,
"grad_norm": 12.526081085205078,
"learning_rate": 4.4000000000000006e-05,
"loss": 0.7762,
"step": 3714
},
{
"epoch": 6.0,
"eval_loss": 1.002115249633789,
"eval_map": 0.5456,
"eval_map_50": 0.7755,
"eval_map_75": 0.6331,
"eval_map_large": 0.5459,
"eval_map_layer_floorplan": 0.5596,
"eval_map_layer_non_floorplan": 0.5315,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.5189,
"eval_mar_10": 0.7423,
"eval_mar_100": 0.7473,
"eval_mar_100_layer_floorplan": 0.7634,
"eval_mar_100_layer_non_floorplan": 0.7312,
"eval_mar_large": 0.7477,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 198.1173,
"eval_samples_per_second": 11.099,
"eval_steps_per_second": 0.697,
"step": 3714
},
{
"epoch": 7.0,
"grad_norm": 14.044904708862305,
"learning_rate": 4.3e-05,
"loss": 0.7409,
"step": 4333
},
{
"epoch": 7.0,
"eval_loss": 0.980305552482605,
"eval_map": 0.5279,
"eval_map_50": 0.742,
"eval_map_75": 0.6106,
"eval_map_large": 0.5283,
"eval_map_layer_floorplan": 0.519,
"eval_map_layer_non_floorplan": 0.5369,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.499,
"eval_mar_10": 0.713,
"eval_mar_100": 0.7182,
"eval_mar_100_layer_floorplan": 0.6898,
"eval_mar_100_layer_non_floorplan": 0.7465,
"eval_mar_large": 0.7186,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 209.8003,
"eval_samples_per_second": 10.481,
"eval_steps_per_second": 0.658,
"step": 4333
},
{
"epoch": 8.0,
"grad_norm": 9.8011474609375,
"learning_rate": 4.2e-05,
"loss": 0.7191,
"step": 4952
},
{
"epoch": 8.0,
"eval_loss": 0.9737862348556519,
"eval_map": 0.5495,
"eval_map_50": 0.7693,
"eval_map_75": 0.6357,
"eval_map_large": 0.5497,
"eval_map_layer_floorplan": 0.5569,
"eval_map_layer_non_floorplan": 0.542,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5066,
"eval_mar_10": 0.7273,
"eval_mar_100": 0.7321,
"eval_mar_100_layer_floorplan": 0.7217,
"eval_mar_100_layer_non_floorplan": 0.7424,
"eval_mar_large": 0.7324,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 144.0008,
"eval_samples_per_second": 15.271,
"eval_steps_per_second": 0.958,
"step": 4952
},
{
"epoch": 9.0,
"grad_norm": 17.39337730407715,
"learning_rate": 4.1e-05,
"loss": 0.6875,
"step": 5571
},
{
"epoch": 9.0,
"eval_loss": 0.9566386938095093,
"eval_map": 0.5568,
"eval_map_50": 0.7737,
"eval_map_75": 0.6427,
"eval_map_large": 0.5571,
"eval_map_layer_floorplan": 0.5738,
"eval_map_layer_non_floorplan": 0.5398,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5216,
"eval_mar_10": 0.7445,
"eval_mar_100": 0.7495,
"eval_mar_100_layer_floorplan": 0.7502,
"eval_mar_100_layer_non_floorplan": 0.7488,
"eval_mar_large": 0.7499,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 196.7202,
"eval_samples_per_second": 11.178,
"eval_steps_per_second": 0.702,
"step": 5571
},
{
"epoch": 10.0,
"grad_norm": 23.622432708740234,
"learning_rate": 4e-05,
"loss": 0.6574,
"step": 6190
},
{
"epoch": 10.0,
"eval_loss": 0.9592899084091187,
"eval_map": 0.566,
"eval_map_50": 0.7816,
"eval_map_75": 0.6534,
"eval_map_large": 0.5663,
"eval_map_layer_floorplan": 0.5839,
"eval_map_layer_non_floorplan": 0.5481,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5291,
"eval_mar_10": 0.7545,
"eval_mar_100": 0.7593,
"eval_mar_100_layer_floorplan": 0.771,
"eval_mar_100_layer_non_floorplan": 0.7477,
"eval_mar_large": 0.7597,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 202.0923,
"eval_samples_per_second": 10.881,
"eval_steps_per_second": 0.683,
"step": 6190
},
{
"epoch": 11.0,
"grad_norm": 13.85277271270752,
"learning_rate": 3.9000000000000006e-05,
"loss": 0.6332,
"step": 6809
},
{
"epoch": 11.0,
"eval_loss": 0.9667688012123108,
"eval_map": 0.5658,
"eval_map_50": 0.7827,
"eval_map_75": 0.6532,
"eval_map_large": 0.566,
"eval_map_layer_floorplan": 0.5933,
"eval_map_layer_non_floorplan": 0.5382,
"eval_map_medium": 0.0505,
"eval_map_small": 0.0,
"eval_mar_1": 0.5277,
"eval_mar_10": 0.7522,
"eval_mar_100": 0.7575,
"eval_mar_100_layer_floorplan": 0.7712,
"eval_mar_100_layer_non_floorplan": 0.7439,
"eval_mar_large": 0.7579,
"eval_mar_medium": 0.05,
"eval_mar_small": 0.0,
"eval_runtime": 160.7511,
"eval_samples_per_second": 13.68,
"eval_steps_per_second": 0.858,
"step": 6809
},
{
"epoch": 12.0,
"grad_norm": 9.858610153198242,
"learning_rate": 3.8e-05,
"loss": 0.607,
"step": 7428
},
{
"epoch": 12.0,
"eval_loss": 0.9639933109283447,
"eval_map": 0.5617,
"eval_map_50": 0.7748,
"eval_map_75": 0.6539,
"eval_map_large": 0.562,
"eval_map_layer_floorplan": 0.5682,
"eval_map_layer_non_floorplan": 0.5553,
"eval_map_medium": 0.1515,
"eval_map_small": 0.0,
"eval_mar_1": 0.5244,
"eval_mar_10": 0.7477,
"eval_mar_100": 0.7535,
"eval_mar_100_layer_floorplan": 0.7554,
"eval_mar_100_layer_non_floorplan": 0.7517,
"eval_mar_large": 0.7539,
"eval_mar_medium": 0.15,
"eval_mar_small": 0.0,
"eval_runtime": 291.5919,
"eval_samples_per_second": 7.541,
"eval_steps_per_second": 0.473,
"step": 7428
},
{
"epoch": 13.0,
"grad_norm": 12.362223625183105,
"learning_rate": 3.7e-05,
"loss": 0.5848,
"step": 8047
},
{
"epoch": 13.0,
"eval_loss": 0.9631391167640686,
"eval_map": 0.5616,
"eval_map_50": 0.7762,
"eval_map_75": 0.6555,
"eval_map_large": 0.5619,
"eval_map_layer_floorplan": 0.5612,
"eval_map_layer_non_floorplan": 0.562,
"eval_map_medium": 0.202,
"eval_map_small": 0.0,
"eval_mar_1": 0.5228,
"eval_mar_10": 0.7442,
"eval_mar_100": 0.7493,
"eval_mar_100_layer_floorplan": 0.7451,
"eval_mar_100_layer_non_floorplan": 0.7534,
"eval_mar_large": 0.7496,
"eval_mar_medium": 0.2,
"eval_mar_small": 0.0,
"eval_runtime": 96.8323,
"eval_samples_per_second": 22.709,
"eval_steps_per_second": 1.425,
"step": 8047
},
{
"epoch": 14.0,
"grad_norm": 13.06834888458252,
"learning_rate": 3.6e-05,
"loss": 0.5699,
"step": 8666
},
{
"epoch": 14.0,
"eval_loss": 0.9597959518432617,
"eval_map": 0.5661,
"eval_map_50": 0.7729,
"eval_map_75": 0.6515,
"eval_map_large": 0.5663,
"eval_map_layer_floorplan": 0.5704,
"eval_map_layer_non_floorplan": 0.5618,
"eval_map_medium": 0.303,
"eval_map_small": 0.0,
"eval_mar_1": 0.5281,
"eval_mar_10": 0.7506,
"eval_mar_100": 0.7559,
"eval_mar_100_layer_floorplan": 0.7567,
"eval_mar_100_layer_non_floorplan": 0.755,
"eval_mar_large": 0.7562,
"eval_mar_medium": 0.3,
"eval_mar_small": 0.0,
"eval_runtime": 95.7299,
"eval_samples_per_second": 22.971,
"eval_steps_per_second": 1.442,
"step": 8666
},
{
"epoch": 15.0,
"grad_norm": 14.259442329406738,
"learning_rate": 3.5e-05,
"loss": 0.5423,
"step": 9285
},
{
"epoch": 15.0,
"eval_loss": 0.9839197993278503,
"eval_map": 0.5705,
"eval_map_50": 0.7785,
"eval_map_75": 0.657,
"eval_map_large": 0.5708,
"eval_map_layer_floorplan": 0.5797,
"eval_map_layer_non_floorplan": 0.5612,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5305,
"eval_mar_10": 0.7529,
"eval_mar_100": 0.7584,
"eval_mar_100_layer_floorplan": 0.7634,
"eval_mar_100_layer_non_floorplan": 0.7534,
"eval_mar_large": 0.7588,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 97.4975,
"eval_samples_per_second": 22.554,
"eval_steps_per_second": 1.415,
"step": 9285
},
{
"epoch": 16.0,
"grad_norm": 18.98026466369629,
"learning_rate": 3.4000000000000007e-05,
"loss": 0.5249,
"step": 9904
},
{
"epoch": 16.0,
"eval_loss": 0.9859117865562439,
"eval_map": 0.5662,
"eval_map_50": 0.7755,
"eval_map_75": 0.6497,
"eval_map_large": 0.5663,
"eval_map_layer_floorplan": 0.5673,
"eval_map_layer_non_floorplan": 0.565,
"eval_map_medium": 0.404,
"eval_map_small": 0.0,
"eval_mar_1": 0.5144,
"eval_mar_10": 0.7364,
"eval_mar_100": 0.7422,
"eval_mar_100_layer_floorplan": 0.726,
"eval_mar_100_layer_non_floorplan": 0.7583,
"eval_mar_large": 0.7424,
"eval_mar_medium": 0.4,
"eval_mar_small": 0.0,
"eval_runtime": 98.0807,
"eval_samples_per_second": 22.42,
"eval_steps_per_second": 1.407,
"step": 9904
},
{
"epoch": 17.0,
"grad_norm": 10.991700172424316,
"learning_rate": 3.3e-05,
"loss": 0.5071,
"step": 10523
},
{
"epoch": 17.0,
"eval_loss": 0.9921765923500061,
"eval_map": 0.5737,
"eval_map_50": 0.7827,
"eval_map_75": 0.6516,
"eval_map_large": 0.5739,
"eval_map_layer_floorplan": 0.5805,
"eval_map_layer_non_floorplan": 0.567,
"eval_map_medium": 0.303,
"eval_map_small": 0.0,
"eval_mar_1": 0.5194,
"eval_mar_10": 0.7465,
"eval_mar_100": 0.7525,
"eval_mar_100_layer_floorplan": 0.7471,
"eval_mar_100_layer_non_floorplan": 0.7579,
"eval_mar_large": 0.7528,
"eval_mar_medium": 0.3,
"eval_mar_small": 0.0,
"eval_runtime": 114.1971,
"eval_samples_per_second": 19.256,
"eval_steps_per_second": 1.208,
"step": 10523
},
{
"epoch": 18.0,
"grad_norm": 11.373696327209473,
"learning_rate": 3.2000000000000005e-05,
"loss": 0.4895,
"step": 11142
},
{
"epoch": 18.0,
"eval_loss": 0.9796280860900879,
"eval_map": 0.5763,
"eval_map_50": 0.7822,
"eval_map_75": 0.6614,
"eval_map_large": 0.5767,
"eval_map_layer_floorplan": 0.5869,
"eval_map_layer_non_floorplan": 0.5658,
"eval_map_medium": 0.101,
"eval_map_small": 0.0,
"eval_mar_1": 0.5269,
"eval_mar_10": 0.7526,
"eval_mar_100": 0.7583,
"eval_mar_100_layer_floorplan": 0.7582,
"eval_mar_100_layer_non_floorplan": 0.7584,
"eval_mar_large": 0.7587,
"eval_mar_medium": 0.1,
"eval_mar_small": 0.0,
"eval_runtime": 164.2202,
"eval_samples_per_second": 13.391,
"eval_steps_per_second": 0.84,
"step": 11142
},
{
"epoch": 19.0,
"grad_norm": 15.639002799987793,
"learning_rate": 3.1e-05,
"loss": 0.4784,
"step": 11761
},
{
"epoch": 19.0,
"eval_loss": 0.9923657774925232,
"eval_map": 0.5794,
"eval_map_50": 0.7862,
"eval_map_75": 0.6607,
"eval_map_large": 0.5797,
"eval_map_layer_floorplan": 0.5907,
"eval_map_layer_non_floorplan": 0.5682,
"eval_map_medium": 0.2525,
"eval_map_small": 0.0,
"eval_mar_1": 0.5286,
"eval_mar_10": 0.7549,
"eval_mar_100": 0.7611,
"eval_mar_100_layer_floorplan": 0.76,
"eval_mar_100_layer_non_floorplan": 0.7623,
"eval_mar_large": 0.7614,
"eval_mar_medium": 0.25,
"eval_mar_small": 0.0,
"eval_runtime": 148.8739,
"eval_samples_per_second": 14.771,
"eval_steps_per_second": 0.927,
"step": 11761
},
{
"epoch": 20.0,
"grad_norm": 11.518092155456543,
"learning_rate": 3e-05,
"loss": 0.4621,
"step": 12380
},
{
"epoch": 20.0,
"eval_loss": 0.9944785833358765,
"eval_map": 0.5815,
"eval_map_50": 0.7851,
"eval_map_75": 0.6678,
"eval_map_large": 0.5816,
"eval_map_layer_floorplan": 0.5936,
"eval_map_layer_non_floorplan": 0.5694,
"eval_map_medium": 0.404,
"eval_map_small": 0.0,
"eval_mar_1": 0.53,
"eval_mar_10": 0.7575,
"eval_mar_100": 0.7625,
"eval_mar_100_layer_floorplan": 0.7674,
"eval_mar_100_layer_non_floorplan": 0.7576,
"eval_mar_large": 0.7628,
"eval_mar_medium": 0.4,
"eval_mar_small": 0.0,
"eval_runtime": 150.1731,
"eval_samples_per_second": 14.643,
"eval_steps_per_second": 0.919,
"step": 12380
},
{
"epoch": 21.0,
"grad_norm": 11.369315147399902,
"learning_rate": 2.9e-05,
"loss": 0.4484,
"step": 12999
},
{
"epoch": 21.0,
"eval_loss": 1.0060081481933594,
"eval_map": 0.5747,
"eval_map_50": 0.7778,
"eval_map_75": 0.6543,
"eval_map_large": 0.575,
"eval_map_layer_floorplan": 0.5877,
"eval_map_layer_non_floorplan": 0.5617,
"eval_map_medium": 0.202,
"eval_map_small": 0.0,
"eval_mar_1": 0.5261,
"eval_mar_10": 0.7515,
"eval_mar_100": 0.7567,
"eval_mar_100_layer_floorplan": 0.7567,
"eval_mar_100_layer_non_floorplan": 0.7567,
"eval_mar_large": 0.7571,
"eval_mar_medium": 0.2,
"eval_mar_small": 0.0,
"eval_runtime": 129.9803,
"eval_samples_per_second": 16.918,
"eval_steps_per_second": 1.062,
"step": 12999
},
{
"epoch": 22.0,
"grad_norm": 14.859123229980469,
"learning_rate": 2.8000000000000003e-05,
"loss": 0.4358,
"step": 13618
},
{
"epoch": 22.0,
"eval_loss": 0.9802154898643494,
"eval_map": 0.5826,
"eval_map_50": 0.7803,
"eval_map_75": 0.6678,
"eval_map_large": 0.5829,
"eval_map_layer_floorplan": 0.5968,
"eval_map_layer_non_floorplan": 0.5683,
"eval_map_medium": 0.0505,
"eval_map_small": 0.0,
"eval_mar_1": 0.5264,
"eval_mar_10": 0.7593,
"eval_mar_100": 0.7652,
"eval_mar_100_layer_floorplan": 0.7666,
"eval_mar_100_layer_non_floorplan": 0.7638,
"eval_mar_large": 0.7656,
"eval_mar_medium": 0.05,
"eval_mar_small": 0.0,
"eval_runtime": 127.1201,
"eval_samples_per_second": 17.299,
"eval_steps_per_second": 1.086,
"step": 13618
},
{
"epoch": 23.0,
"grad_norm": 12.832348823547363,
"learning_rate": 2.7000000000000002e-05,
"loss": 0.4236,
"step": 14237
},
{
"epoch": 23.0,
"eval_loss": 1.0017343759536743,
"eval_map": 0.5854,
"eval_map_50": 0.7887,
"eval_map_75": 0.671,
"eval_map_large": 0.5858,
"eval_map_layer_floorplan": 0.6009,
"eval_map_layer_non_floorplan": 0.5699,
"eval_map_medium": 0.0,
"eval_map_small": 0.0,
"eval_mar_1": 0.5276,
"eval_mar_10": 0.7597,
"eval_mar_100": 0.7648,
"eval_mar_100_layer_floorplan": 0.768,
"eval_mar_100_layer_non_floorplan": 0.7616,
"eval_mar_large": 0.7652,
"eval_mar_medium": 0.0,
"eval_mar_small": 0.0,
"eval_runtime": 219.2113,
"eval_samples_per_second": 10.031,
"eval_steps_per_second": 0.63,
"step": 14237
}
],
"logging_steps": 500,
"max_steps": 30950,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 5,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 0
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.4729502081028093e+20,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}