{ "best_metric": 0.5854, "best_model_checkpoint": "/home/azureuser/cloudfiles/code/Users/nick.degroot/page-segmentation/runs/20250307-table-transformer-is-floorplan/checkpoint-14237", "epoch": 23.0, "eval_steps": 500, "global_step": 14237, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "grad_norm": 12.473027229309082, "learning_rate": 4.9e-05, "loss": 0.9573, "step": 619 }, { "epoch": 1.0, "eval_loss": 1.048191785812378, "eval_map": 0.4914, "eval_map_50": 0.7176, "eval_map_75": 0.5594, "eval_map_large": 0.4916, "eval_map_layer_floorplan": 0.4995, "eval_map_layer_non_floorplan": 0.4832, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.4913, "eval_mar_10": 0.7178, "eval_mar_100": 0.7221, "eval_mar_100_layer_floorplan": 0.7331, "eval_mar_100_layer_non_floorplan": 0.7112, "eval_mar_large": 0.7225, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 96.7259, "eval_samples_per_second": 22.734, "eval_steps_per_second": 1.427, "step": 619 }, { "epoch": 2.0, "grad_norm": 10.47475528717041, "learning_rate": 4.8e-05, "loss": 0.9177, "step": 1238 }, { "epoch": 2.0, "eval_loss": 1.0183632373809814, "eval_map": 0.5167, "eval_map_50": 0.7402, "eval_map_75": 0.5901, "eval_map_large": 0.517, "eval_map_layer_floorplan": 0.524, "eval_map_layer_non_floorplan": 0.5093, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.5002, "eval_mar_10": 0.7294, "eval_mar_100": 0.7339, "eval_mar_100_layer_floorplan": 0.74, "eval_mar_100_layer_non_floorplan": 0.7278, "eval_mar_large": 0.7343, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 98.7563, "eval_samples_per_second": 22.267, "eval_steps_per_second": 1.397, "step": 1238 }, { "epoch": 3.0, "grad_norm": 20.04204750061035, "learning_rate": 4.7e-05, "loss": 0.8733, "step": 1857 }, { "epoch": 3.0, "eval_loss": 1.004949927330017, "eval_map": 0.513, "eval_map_50": 0.7336, "eval_map_75": 0.592, "eval_map_large": 0.5133, "eval_map_layer_floorplan": 0.5146, "eval_map_layer_non_floorplan": 0.5115, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5033, "eval_mar_10": 0.7314, "eval_mar_100": 0.7355, "eval_mar_100_layer_floorplan": 0.7343, "eval_mar_100_layer_non_floorplan": 0.7367, "eval_mar_large": 0.7359, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 99.4564, "eval_samples_per_second": 22.11, "eval_steps_per_second": 1.388, "step": 1857 }, { "epoch": 4.0, "grad_norm": 13.674722671508789, "learning_rate": 4.600000000000001e-05, "loss": 0.8412, "step": 2476 }, { "epoch": 4.0, "eval_loss": 0.9946977496147156, "eval_map": 0.5209, "eval_map_50": 0.7417, "eval_map_75": 0.6007, "eval_map_large": 0.5212, "eval_map_layer_floorplan": 0.5212, "eval_map_layer_non_floorplan": 0.5207, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.5025, "eval_mar_10": 0.7295, "eval_mar_100": 0.7341, "eval_mar_100_layer_floorplan": 0.7329, "eval_mar_100_layer_non_floorplan": 0.7352, "eval_mar_large": 0.7345, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 99.2293, "eval_samples_per_second": 22.161, "eval_steps_per_second": 1.391, "step": 2476 }, { "epoch": 5.0, "grad_norm": 16.09870719909668, "learning_rate": 4.5e-05, "loss": 0.8108, "step": 3095 }, { "epoch": 5.0, "eval_loss": 1.0007381439208984, "eval_map": 0.5323, "eval_map_50": 0.76, "eval_map_75": 0.6165, "eval_map_large": 0.5326, "eval_map_layer_floorplan": 0.5335, "eval_map_layer_non_floorplan": 0.5311, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.4993, "eval_mar_10": 0.7173, "eval_mar_100": 0.7217, "eval_mar_100_layer_floorplan": 0.7096, "eval_mar_100_layer_non_floorplan": 0.7339, "eval_mar_large": 0.7221, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 102.6206, "eval_samples_per_second": 21.428, "eval_steps_per_second": 1.345, "step": 3095 }, { "epoch": 6.0, "grad_norm": 12.526081085205078, "learning_rate": 4.4000000000000006e-05, "loss": 0.7762, "step": 3714 }, { "epoch": 6.0, "eval_loss": 1.002115249633789, "eval_map": 0.5456, "eval_map_50": 0.7755, "eval_map_75": 0.6331, "eval_map_large": 0.5459, "eval_map_layer_floorplan": 0.5596, "eval_map_layer_non_floorplan": 0.5315, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.5189, "eval_mar_10": 0.7423, "eval_mar_100": 0.7473, "eval_mar_100_layer_floorplan": 0.7634, "eval_mar_100_layer_non_floorplan": 0.7312, "eval_mar_large": 0.7477, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 198.1173, "eval_samples_per_second": 11.099, "eval_steps_per_second": 0.697, "step": 3714 }, { "epoch": 7.0, "grad_norm": 14.044904708862305, "learning_rate": 4.3e-05, "loss": 0.7409, "step": 4333 }, { "epoch": 7.0, "eval_loss": 0.980305552482605, "eval_map": 0.5279, "eval_map_50": 0.742, "eval_map_75": 0.6106, "eval_map_large": 0.5283, "eval_map_layer_floorplan": 0.519, "eval_map_layer_non_floorplan": 0.5369, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.499, "eval_mar_10": 0.713, "eval_mar_100": 0.7182, "eval_mar_100_layer_floorplan": 0.6898, "eval_mar_100_layer_non_floorplan": 0.7465, "eval_mar_large": 0.7186, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 209.8003, "eval_samples_per_second": 10.481, "eval_steps_per_second": 0.658, "step": 4333 }, { "epoch": 8.0, "grad_norm": 9.8011474609375, "learning_rate": 4.2e-05, "loss": 0.7191, "step": 4952 }, { "epoch": 8.0, "eval_loss": 0.9737862348556519, "eval_map": 0.5495, "eval_map_50": 0.7693, "eval_map_75": 0.6357, "eval_map_large": 0.5497, "eval_map_layer_floorplan": 0.5569, "eval_map_layer_non_floorplan": 0.542, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5066, "eval_mar_10": 0.7273, "eval_mar_100": 0.7321, "eval_mar_100_layer_floorplan": 0.7217, "eval_mar_100_layer_non_floorplan": 0.7424, "eval_mar_large": 0.7324, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 144.0008, "eval_samples_per_second": 15.271, "eval_steps_per_second": 0.958, "step": 4952 }, { "epoch": 9.0, "grad_norm": 17.39337730407715, "learning_rate": 4.1e-05, "loss": 0.6875, "step": 5571 }, { "epoch": 9.0, "eval_loss": 0.9566386938095093, "eval_map": 0.5568, "eval_map_50": 0.7737, "eval_map_75": 0.6427, "eval_map_large": 0.5571, "eval_map_layer_floorplan": 0.5738, "eval_map_layer_non_floorplan": 0.5398, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5216, "eval_mar_10": 0.7445, "eval_mar_100": 0.7495, "eval_mar_100_layer_floorplan": 0.7502, "eval_mar_100_layer_non_floorplan": 0.7488, "eval_mar_large": 0.7499, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 196.7202, "eval_samples_per_second": 11.178, "eval_steps_per_second": 0.702, "step": 5571 }, { "epoch": 10.0, "grad_norm": 23.622432708740234, "learning_rate": 4e-05, "loss": 0.6574, "step": 6190 }, { "epoch": 10.0, "eval_loss": 0.9592899084091187, "eval_map": 0.566, "eval_map_50": 0.7816, "eval_map_75": 0.6534, "eval_map_large": 0.5663, "eval_map_layer_floorplan": 0.5839, "eval_map_layer_non_floorplan": 0.5481, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5291, "eval_mar_10": 0.7545, "eval_mar_100": 0.7593, "eval_mar_100_layer_floorplan": 0.771, "eval_mar_100_layer_non_floorplan": 0.7477, "eval_mar_large": 0.7597, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 202.0923, "eval_samples_per_second": 10.881, "eval_steps_per_second": 0.683, "step": 6190 }, { "epoch": 11.0, "grad_norm": 13.85277271270752, "learning_rate": 3.9000000000000006e-05, "loss": 0.6332, "step": 6809 }, { "epoch": 11.0, "eval_loss": 0.9667688012123108, "eval_map": 0.5658, "eval_map_50": 0.7827, "eval_map_75": 0.6532, "eval_map_large": 0.566, "eval_map_layer_floorplan": 0.5933, "eval_map_layer_non_floorplan": 0.5382, "eval_map_medium": 0.0505, "eval_map_small": 0.0, "eval_mar_1": 0.5277, "eval_mar_10": 0.7522, "eval_mar_100": 0.7575, "eval_mar_100_layer_floorplan": 0.7712, "eval_mar_100_layer_non_floorplan": 0.7439, "eval_mar_large": 0.7579, "eval_mar_medium": 0.05, "eval_mar_small": 0.0, "eval_runtime": 160.7511, "eval_samples_per_second": 13.68, "eval_steps_per_second": 0.858, "step": 6809 }, { "epoch": 12.0, "grad_norm": 9.858610153198242, "learning_rate": 3.8e-05, "loss": 0.607, "step": 7428 }, { "epoch": 12.0, "eval_loss": 0.9639933109283447, "eval_map": 0.5617, "eval_map_50": 0.7748, "eval_map_75": 0.6539, "eval_map_large": 0.562, "eval_map_layer_floorplan": 0.5682, "eval_map_layer_non_floorplan": 0.5553, "eval_map_medium": 0.1515, "eval_map_small": 0.0, "eval_mar_1": 0.5244, "eval_mar_10": 0.7477, "eval_mar_100": 0.7535, "eval_mar_100_layer_floorplan": 0.7554, "eval_mar_100_layer_non_floorplan": 0.7517, "eval_mar_large": 0.7539, "eval_mar_medium": 0.15, "eval_mar_small": 0.0, "eval_runtime": 291.5919, "eval_samples_per_second": 7.541, "eval_steps_per_second": 0.473, "step": 7428 }, { "epoch": 13.0, "grad_norm": 12.362223625183105, "learning_rate": 3.7e-05, "loss": 0.5848, "step": 8047 }, { "epoch": 13.0, "eval_loss": 0.9631391167640686, "eval_map": 0.5616, "eval_map_50": 0.7762, "eval_map_75": 0.6555, "eval_map_large": 0.5619, "eval_map_layer_floorplan": 0.5612, "eval_map_layer_non_floorplan": 0.562, "eval_map_medium": 0.202, "eval_map_small": 0.0, "eval_mar_1": 0.5228, "eval_mar_10": 0.7442, "eval_mar_100": 0.7493, "eval_mar_100_layer_floorplan": 0.7451, "eval_mar_100_layer_non_floorplan": 0.7534, "eval_mar_large": 0.7496, "eval_mar_medium": 0.2, "eval_mar_small": 0.0, "eval_runtime": 96.8323, "eval_samples_per_second": 22.709, "eval_steps_per_second": 1.425, "step": 8047 }, { "epoch": 14.0, "grad_norm": 13.06834888458252, "learning_rate": 3.6e-05, "loss": 0.5699, "step": 8666 }, { "epoch": 14.0, "eval_loss": 0.9597959518432617, "eval_map": 0.5661, "eval_map_50": 0.7729, "eval_map_75": 0.6515, "eval_map_large": 0.5663, "eval_map_layer_floorplan": 0.5704, "eval_map_layer_non_floorplan": 0.5618, "eval_map_medium": 0.303, "eval_map_small": 0.0, "eval_mar_1": 0.5281, "eval_mar_10": 0.7506, "eval_mar_100": 0.7559, "eval_mar_100_layer_floorplan": 0.7567, "eval_mar_100_layer_non_floorplan": 0.755, "eval_mar_large": 0.7562, "eval_mar_medium": 0.3, "eval_mar_small": 0.0, "eval_runtime": 95.7299, "eval_samples_per_second": 22.971, "eval_steps_per_second": 1.442, "step": 8666 }, { "epoch": 15.0, "grad_norm": 14.259442329406738, "learning_rate": 3.5e-05, "loss": 0.5423, "step": 9285 }, { "epoch": 15.0, "eval_loss": 0.9839197993278503, "eval_map": 0.5705, "eval_map_50": 0.7785, "eval_map_75": 0.657, "eval_map_large": 0.5708, "eval_map_layer_floorplan": 0.5797, "eval_map_layer_non_floorplan": 0.5612, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5305, "eval_mar_10": 0.7529, "eval_mar_100": 0.7584, "eval_mar_100_layer_floorplan": 0.7634, "eval_mar_100_layer_non_floorplan": 0.7534, "eval_mar_large": 0.7588, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 97.4975, "eval_samples_per_second": 22.554, "eval_steps_per_second": 1.415, "step": 9285 }, { "epoch": 16.0, "grad_norm": 18.98026466369629, "learning_rate": 3.4000000000000007e-05, "loss": 0.5249, "step": 9904 }, { "epoch": 16.0, "eval_loss": 0.9859117865562439, "eval_map": 0.5662, "eval_map_50": 0.7755, "eval_map_75": 0.6497, "eval_map_large": 0.5663, "eval_map_layer_floorplan": 0.5673, "eval_map_layer_non_floorplan": 0.565, "eval_map_medium": 0.404, "eval_map_small": 0.0, "eval_mar_1": 0.5144, "eval_mar_10": 0.7364, "eval_mar_100": 0.7422, "eval_mar_100_layer_floorplan": 0.726, "eval_mar_100_layer_non_floorplan": 0.7583, "eval_mar_large": 0.7424, "eval_mar_medium": 0.4, "eval_mar_small": 0.0, "eval_runtime": 98.0807, "eval_samples_per_second": 22.42, "eval_steps_per_second": 1.407, "step": 9904 }, { "epoch": 17.0, "grad_norm": 10.991700172424316, "learning_rate": 3.3e-05, "loss": 0.5071, "step": 10523 }, { "epoch": 17.0, "eval_loss": 0.9921765923500061, "eval_map": 0.5737, "eval_map_50": 0.7827, "eval_map_75": 0.6516, "eval_map_large": 0.5739, "eval_map_layer_floorplan": 0.5805, "eval_map_layer_non_floorplan": 0.567, "eval_map_medium": 0.303, "eval_map_small": 0.0, "eval_mar_1": 0.5194, "eval_mar_10": 0.7465, "eval_mar_100": 0.7525, "eval_mar_100_layer_floorplan": 0.7471, "eval_mar_100_layer_non_floorplan": 0.7579, "eval_mar_large": 0.7528, "eval_mar_medium": 0.3, "eval_mar_small": 0.0, "eval_runtime": 114.1971, "eval_samples_per_second": 19.256, "eval_steps_per_second": 1.208, "step": 10523 }, { "epoch": 18.0, "grad_norm": 11.373696327209473, "learning_rate": 3.2000000000000005e-05, "loss": 0.4895, "step": 11142 }, { "epoch": 18.0, "eval_loss": 0.9796280860900879, "eval_map": 0.5763, "eval_map_50": 0.7822, "eval_map_75": 0.6614, "eval_map_large": 0.5767, "eval_map_layer_floorplan": 0.5869, "eval_map_layer_non_floorplan": 0.5658, "eval_map_medium": 0.101, "eval_map_small": 0.0, "eval_mar_1": 0.5269, "eval_mar_10": 0.7526, "eval_mar_100": 0.7583, "eval_mar_100_layer_floorplan": 0.7582, "eval_mar_100_layer_non_floorplan": 0.7584, "eval_mar_large": 0.7587, "eval_mar_medium": 0.1, "eval_mar_small": 0.0, "eval_runtime": 164.2202, "eval_samples_per_second": 13.391, "eval_steps_per_second": 0.84, "step": 11142 }, { "epoch": 19.0, "grad_norm": 15.639002799987793, "learning_rate": 3.1e-05, "loss": 0.4784, "step": 11761 }, { "epoch": 19.0, "eval_loss": 0.9923657774925232, "eval_map": 0.5794, "eval_map_50": 0.7862, "eval_map_75": 0.6607, "eval_map_large": 0.5797, "eval_map_layer_floorplan": 0.5907, "eval_map_layer_non_floorplan": 0.5682, "eval_map_medium": 0.2525, "eval_map_small": 0.0, "eval_mar_1": 0.5286, "eval_mar_10": 0.7549, "eval_mar_100": 0.7611, "eval_mar_100_layer_floorplan": 0.76, "eval_mar_100_layer_non_floorplan": 0.7623, "eval_mar_large": 0.7614, "eval_mar_medium": 0.25, "eval_mar_small": 0.0, "eval_runtime": 148.8739, "eval_samples_per_second": 14.771, "eval_steps_per_second": 0.927, "step": 11761 }, { "epoch": 20.0, "grad_norm": 11.518092155456543, "learning_rate": 3e-05, "loss": 0.4621, "step": 12380 }, { "epoch": 20.0, "eval_loss": 0.9944785833358765, "eval_map": 0.5815, "eval_map_50": 0.7851, "eval_map_75": 0.6678, "eval_map_large": 0.5816, "eval_map_layer_floorplan": 0.5936, "eval_map_layer_non_floorplan": 0.5694, "eval_map_medium": 0.404, "eval_map_small": 0.0, "eval_mar_1": 0.53, "eval_mar_10": 0.7575, "eval_mar_100": 0.7625, "eval_mar_100_layer_floorplan": 0.7674, "eval_mar_100_layer_non_floorplan": 0.7576, "eval_mar_large": 0.7628, "eval_mar_medium": 0.4, "eval_mar_small": 0.0, "eval_runtime": 150.1731, "eval_samples_per_second": 14.643, "eval_steps_per_second": 0.919, "step": 12380 }, { "epoch": 21.0, "grad_norm": 11.369315147399902, "learning_rate": 2.9e-05, "loss": 0.4484, "step": 12999 }, { "epoch": 21.0, "eval_loss": 1.0060081481933594, "eval_map": 0.5747, "eval_map_50": 0.7778, "eval_map_75": 0.6543, "eval_map_large": 0.575, "eval_map_layer_floorplan": 0.5877, "eval_map_layer_non_floorplan": 0.5617, "eval_map_medium": 0.202, "eval_map_small": 0.0, "eval_mar_1": 0.5261, "eval_mar_10": 0.7515, "eval_mar_100": 0.7567, "eval_mar_100_layer_floorplan": 0.7567, "eval_mar_100_layer_non_floorplan": 0.7567, "eval_mar_large": 0.7571, "eval_mar_medium": 0.2, "eval_mar_small": 0.0, "eval_runtime": 129.9803, "eval_samples_per_second": 16.918, "eval_steps_per_second": 1.062, "step": 12999 }, { "epoch": 22.0, "grad_norm": 14.859123229980469, "learning_rate": 2.8000000000000003e-05, "loss": 0.4358, "step": 13618 }, { "epoch": 22.0, "eval_loss": 0.9802154898643494, "eval_map": 0.5826, "eval_map_50": 0.7803, "eval_map_75": 0.6678, "eval_map_large": 0.5829, "eval_map_layer_floorplan": 0.5968, "eval_map_layer_non_floorplan": 0.5683, "eval_map_medium": 0.0505, "eval_map_small": 0.0, "eval_mar_1": 0.5264, "eval_mar_10": 0.7593, "eval_mar_100": 0.7652, "eval_mar_100_layer_floorplan": 0.7666, "eval_mar_100_layer_non_floorplan": 0.7638, "eval_mar_large": 0.7656, "eval_mar_medium": 0.05, "eval_mar_small": 0.0, "eval_runtime": 127.1201, "eval_samples_per_second": 17.299, "eval_steps_per_second": 1.086, "step": 13618 }, { "epoch": 23.0, "grad_norm": 12.832348823547363, "learning_rate": 2.7000000000000002e-05, "loss": 0.4236, "step": 14237 }, { "epoch": 23.0, "eval_loss": 1.0017343759536743, "eval_map": 0.5854, "eval_map_50": 0.7887, "eval_map_75": 0.671, "eval_map_large": 0.5858, "eval_map_layer_floorplan": 0.6009, "eval_map_layer_non_floorplan": 0.5699, "eval_map_medium": 0.0, "eval_map_small": 0.0, "eval_mar_1": 0.5276, "eval_mar_10": 0.7597, "eval_mar_100": 0.7648, "eval_mar_100_layer_floorplan": 0.768, "eval_mar_100_layer_non_floorplan": 0.7616, "eval_mar_large": 0.7652, "eval_mar_medium": 0.0, "eval_mar_small": 0.0, "eval_runtime": 219.2113, "eval_samples_per_second": 10.031, "eval_steps_per_second": 0.63, "step": 14237 } ], "logging_steps": 500, "max_steps": 30950, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 5, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 1.4729502081028093e+20, "train_batch_size": 32, "trial_name": null, "trial_params": null }