sedrickkeh's picture
Training in progress, epoch 2
a202694 verified
{"current_steps": 1, "total_steps": 186, "loss": 0.7913, "lr": 4.210526315789474e-06, "epoch": 0.016, "percentage": 0.54, "elapsed_time": "0:04:34", "remaining_time": "14:06:05"}
{"current_steps": 2, "total_steps": 186, "loss": 0.7915, "lr": 8.421052631578948e-06, "epoch": 0.032, "percentage": 1.08, "elapsed_time": "0:08:11", "remaining_time": "12:34:01"}
{"current_steps": 3, "total_steps": 186, "loss": 0.7505, "lr": 1.263157894736842e-05, "epoch": 0.048, "percentage": 1.61, "elapsed_time": "0:11:49", "remaining_time": "12:01:33"}
{"current_steps": 4, "total_steps": 186, "loss": 0.6908, "lr": 1.6842105263157896e-05, "epoch": 0.064, "percentage": 2.15, "elapsed_time": "0:15:27", "remaining_time": "11:42:58"}
{"current_steps": 5, "total_steps": 186, "loss": 0.7192, "lr": 2.105263157894737e-05, "epoch": 0.08, "percentage": 2.69, "elapsed_time": "0:19:04", "remaining_time": "11:30:38"}
{"current_steps": 6, "total_steps": 186, "loss": 0.7618, "lr": 2.526315789473684e-05, "epoch": 0.096, "percentage": 3.23, "elapsed_time": "0:22:42", "remaining_time": "11:21:17"}
{"current_steps": 7, "total_steps": 186, "loss": 0.7162, "lr": 2.9473684210526317e-05, "epoch": 0.112, "percentage": 3.76, "elapsed_time": "0:26:19", "remaining_time": "11:13:16"}
{"current_steps": 8, "total_steps": 186, "loss": 0.6638, "lr": 3.368421052631579e-05, "epoch": 0.128, "percentage": 4.3, "elapsed_time": "0:29:57", "remaining_time": "11:06:35"}
{"current_steps": 9, "total_steps": 186, "loss": 0.6244, "lr": 3.789473684210526e-05, "epoch": 0.144, "percentage": 4.84, "elapsed_time": "0:33:35", "remaining_time": "11:00:37"}
{"current_steps": 10, "total_steps": 186, "loss": 0.6009, "lr": 4.210526315789474e-05, "epoch": 0.16, "percentage": 5.38, "elapsed_time": "0:37:13", "remaining_time": "10:55:03"}
{"current_steps": 11, "total_steps": 186, "loss": 0.5816, "lr": 4.6315789473684214e-05, "epoch": 0.176, "percentage": 5.91, "elapsed_time": "0:40:50", "remaining_time": "10:49:46"}
{"current_steps": 12, "total_steps": 186, "loss": 0.6001, "lr": 5.052631578947368e-05, "epoch": 0.192, "percentage": 6.45, "elapsed_time": "0:44:28", "remaining_time": "10:44:46"}
{"current_steps": 13, "total_steps": 186, "loss": 0.5923, "lr": 5.4736842105263165e-05, "epoch": 0.208, "percentage": 6.99, "elapsed_time": "0:48:05", "remaining_time": "10:40:01"}
{"current_steps": 14, "total_steps": 186, "loss": 0.5706, "lr": 5.8947368421052634e-05, "epoch": 0.224, "percentage": 7.53, "elapsed_time": "0:51:43", "remaining_time": "10:35:26"}
{"current_steps": 15, "total_steps": 186, "loss": 0.5565, "lr": 6.315789473684212e-05, "epoch": 0.24, "percentage": 8.06, "elapsed_time": "0:55:21", "remaining_time": "10:31:01"}
{"current_steps": 16, "total_steps": 186, "loss": 0.5475, "lr": 6.736842105263159e-05, "epoch": 0.256, "percentage": 8.6, "elapsed_time": "0:58:58", "remaining_time": "10:26:39"}
{"current_steps": 17, "total_steps": 186, "loss": 0.6018, "lr": 7.157894736842105e-05, "epoch": 0.272, "percentage": 9.14, "elapsed_time": "1:02:36", "remaining_time": "10:22:21"}
{"current_steps": 18, "total_steps": 186, "loss": 0.5425, "lr": 7.578947368421052e-05, "epoch": 0.288, "percentage": 9.68, "elapsed_time": "1:06:13", "remaining_time": "10:18:06"}
{"current_steps": 19, "total_steps": 186, "loss": 0.554, "lr": 8e-05, "epoch": 0.304, "percentage": 10.22, "elapsed_time": "1:09:51", "remaining_time": "10:13:57"}
{"current_steps": 20, "total_steps": 186, "loss": 0.5573, "lr": 7.999292243297167e-05, "epoch": 0.32, "percentage": 10.75, "elapsed_time": "1:13:28", "remaining_time": "10:09:50"}
{"current_steps": 21, "total_steps": 186, "loss": 0.5248, "lr": 7.997169223648443e-05, "epoch": 0.336, "percentage": 11.29, "elapsed_time": "1:17:06", "remaining_time": "10:05:50"}
{"current_steps": 22, "total_steps": 186, "loss": 0.5208, "lr": 7.993631692344518e-05, "epoch": 0.352, "percentage": 11.83, "elapsed_time": "1:20:43", "remaining_time": "10:01:47"}
{"current_steps": 23, "total_steps": 186, "loss": 0.5215, "lr": 7.988680901241142e-05, "epoch": 0.368, "percentage": 12.37, "elapsed_time": "1:24:21", "remaining_time": "9:57:48"}
{"current_steps": 24, "total_steps": 186, "loss": 0.5076, "lr": 7.982318602316107e-05, "epoch": 0.384, "percentage": 12.9, "elapsed_time": "1:27:59", "remaining_time": "9:53:53"}
{"current_steps": 25, "total_steps": 186, "loss": 0.5094, "lr": 7.974547047049269e-05, "epoch": 0.4, "percentage": 13.44, "elapsed_time": "1:31:36", "remaining_time": "9:49:57"}
{"current_steps": 26, "total_steps": 186, "loss": 0.5012, "lr": 7.965368985625792e-05, "epoch": 0.416, "percentage": 13.98, "elapsed_time": "1:35:14", "remaining_time": "9:46:05"}
{"current_steps": 27, "total_steps": 186, "loss": 0.5007, "lr": 7.954787665962922e-05, "epoch": 0.432, "percentage": 14.52, "elapsed_time": "1:38:51", "remaining_time": "9:42:11"}
{"current_steps": 28, "total_steps": 186, "loss": 0.4822, "lr": 7.94280683256062e-05, "epoch": 0.448, "percentage": 15.05, "elapsed_time": "1:42:28", "remaining_time": "9:38:17"}
{"current_steps": 29, "total_steps": 186, "loss": 0.4889, "lr": 7.929430725176456e-05, "epoch": 0.464, "percentage": 15.59, "elapsed_time": "1:46:06", "remaining_time": "9:34:27"}
{"current_steps": 30, "total_steps": 186, "loss": 0.4762, "lr": 7.91466407732526e-05, "epoch": 0.48, "percentage": 16.13, "elapsed_time": "1:49:44", "remaining_time": "9:30:37"}
{"current_steps": 31, "total_steps": 186, "loss": 0.4726, "lr": 7.898512114604028e-05, "epoch": 0.496, "percentage": 16.67, "elapsed_time": "1:53:21", "remaining_time": "9:26:49"}
{"current_steps": 32, "total_steps": 186, "loss": 0.4785, "lr": 7.880980552842705e-05, "epoch": 0.512, "percentage": 17.2, "elapsed_time": "1:56:59", "remaining_time": "9:23:00"}
{"current_steps": 33, "total_steps": 186, "loss": 0.4755, "lr": 7.862075596081459e-05, "epoch": 0.528, "percentage": 17.74, "elapsed_time": "2:00:36", "remaining_time": "9:19:13"}
{"current_steps": 34, "total_steps": 186, "loss": 0.473, "lr": 7.841803934375226e-05, "epoch": 0.544, "percentage": 18.28, "elapsed_time": "2:04:14", "remaining_time": "9:15:25"}
{"current_steps": 35, "total_steps": 186, "loss": 0.4751, "lr": 7.820172741426231e-05, "epoch": 0.56, "percentage": 18.82, "elapsed_time": "2:07:52", "remaining_time": "9:11:40"}
{"current_steps": 36, "total_steps": 186, "loss": 0.4702, "lr": 7.79718967204537e-05, "epoch": 0.576, "percentage": 19.35, "elapsed_time": "2:11:30", "remaining_time": "9:07:56"}
{"current_steps": 37, "total_steps": 186, "loss": 0.4747, "lr": 7.772862859443352e-05, "epoch": 0.592, "percentage": 19.89, "elapsed_time": "2:15:08", "remaining_time": "9:04:12"}
{"current_steps": 38, "total_steps": 186, "loss": 0.4649, "lr": 7.747200912352512e-05, "epoch": 0.608, "percentage": 20.43, "elapsed_time": "2:18:46", "remaining_time": "9:00:29"}
{"current_steps": 39, "total_steps": 186, "loss": 0.4545, "lr": 7.72021291198038e-05, "epoch": 0.624, "percentage": 20.97, "elapsed_time": "2:22:24", "remaining_time": "8:56:45"}
{"current_steps": 40, "total_steps": 186, "loss": 0.4614, "lr": 7.691908408796038e-05, "epoch": 0.64, "percentage": 21.51, "elapsed_time": "2:26:02", "remaining_time": "8:53:01"}
{"current_steps": 41, "total_steps": 186, "loss": 0.4573, "lr": 7.66229741915041e-05, "epoch": 0.656, "percentage": 22.04, "elapsed_time": "2:29:39", "remaining_time": "8:49:17"}
{"current_steps": 42, "total_steps": 186, "loss": 0.4548, "lr": 7.631390421731695e-05, "epoch": 0.672, "percentage": 22.58, "elapsed_time": "2:33:17", "remaining_time": "8:45:33"}
{"current_steps": 43, "total_steps": 186, "loss": 0.4531, "lr": 7.599198353857187e-05, "epoch": 0.688, "percentage": 23.12, "elapsed_time": "2:36:54", "remaining_time": "8:41:48"}
{"current_steps": 44, "total_steps": 186, "loss": 0.4525, "lr": 7.565732607602794e-05, "epoch": 0.704, "percentage": 23.66, "elapsed_time": "2:40:32", "remaining_time": "8:38:07"}
{"current_steps": 45, "total_steps": 186, "loss": 0.4613, "lr": 7.53100502577163e-05, "epoch": 0.72, "percentage": 24.19, "elapsed_time": "2:44:10", "remaining_time": "8:34:24"}
{"current_steps": 46, "total_steps": 186, "loss": 0.4476, "lr": 7.495027897703102e-05, "epoch": 0.736, "percentage": 24.73, "elapsed_time": "2:47:48", "remaining_time": "8:30:42"}
{"current_steps": 47, "total_steps": 186, "loss": 0.456, "lr": 7.457813954923979e-05, "epoch": 0.752, "percentage": 25.27, "elapsed_time": "2:51:25", "remaining_time": "8:26:59"}
{"current_steps": 48, "total_steps": 186, "loss": 0.4602, "lr": 7.419376366642982e-05, "epoch": 0.768, "percentage": 25.81, "elapsed_time": "2:55:03", "remaining_time": "8:23:16"}
{"current_steps": 49, "total_steps": 186, "loss": 0.4489, "lr": 7.379728735090483e-05, "epoch": 0.784, "percentage": 26.34, "elapsed_time": "2:58:40", "remaining_time": "8:19:34"}
{"current_steps": 50, "total_steps": 186, "loss": 0.4426, "lr": 7.338885090704975e-05, "epoch": 0.8, "percentage": 26.88, "elapsed_time": "3:02:18", "remaining_time": "8:15:51"}
{"current_steps": 51, "total_steps": 186, "loss": 0.4452, "lr": 7.296859887167997e-05, "epoch": 0.816, "percentage": 27.42, "elapsed_time": "3:05:55", "remaining_time": "8:12:09"}
{"current_steps": 52, "total_steps": 186, "loss": 0.4458, "lr": 7.253667996289298e-05, "epoch": 0.832, "percentage": 27.96, "elapsed_time": "3:09:33", "remaining_time": "8:08:27"}
{"current_steps": 53, "total_steps": 186, "loss": 0.4396, "lr": 7.209324702744015e-05, "epoch": 0.848, "percentage": 28.49, "elapsed_time": "3:13:10", "remaining_time": "8:04:45"}
{"current_steps": 54, "total_steps": 186, "loss": 0.4287, "lr": 7.163845698663763e-05, "epoch": 0.864, "percentage": 29.03, "elapsed_time": "3:16:48", "remaining_time": "8:01:04"}
{"current_steps": 55, "total_steps": 186, "loss": 0.4327, "lr": 7.117247078083531e-05, "epoch": 0.88, "percentage": 29.57, "elapsed_time": "3:20:25", "remaining_time": "7:57:23"}
{"current_steps": 56, "total_steps": 186, "loss": 0.4245, "lr": 7.069545331246348e-05, "epoch": 0.896, "percentage": 30.11, "elapsed_time": "3:24:03", "remaining_time": "7:53:42"}
{"current_steps": 57, "total_steps": 186, "loss": 0.429, "lr": 7.020757338767745e-05, "epoch": 0.912, "percentage": 30.65, "elapsed_time": "3:27:41", "remaining_time": "7:50:01"}
{"current_steps": 58, "total_steps": 186, "loss": 0.4274, "lr": 6.970900365662068e-05, "epoch": 0.928, "percentage": 31.18, "elapsed_time": "3:31:18", "remaining_time": "7:46:20"}
{"current_steps": 59, "total_steps": 186, "loss": 0.4349, "lr": 6.919992055232768e-05, "epoch": 0.944, "percentage": 31.72, "elapsed_time": "3:34:56", "remaining_time": "7:42:40"}
{"current_steps": 60, "total_steps": 186, "loss": 0.4277, "lr": 6.868050422828812e-05, "epoch": 0.96, "percentage": 32.26, "elapsed_time": "3:38:34", "remaining_time": "7:38:59"}
{"current_steps": 61, "total_steps": 186, "loss": 0.4296, "lr": 6.815093849469446e-05, "epoch": 0.976, "percentage": 32.8, "elapsed_time": "3:42:11", "remaining_time": "7:35:19"}
{"current_steps": 62, "total_steps": 186, "loss": 0.4256, "lr": 6.761141075339546e-05, "epoch": 0.992, "percentage": 33.33, "elapsed_time": "3:45:49", "remaining_time": "7:31:38"}
{"current_steps": 63, "total_steps": 186, "loss": 0.7285, "lr": 6.706211193157875e-05, "epoch": 1.012, "percentage": 33.87, "elapsed_time": "3:50:55", "remaining_time": "7:30:50"}
{"current_steps": 64, "total_steps": 186, "loss": 0.4151, "lr": 6.650323641420585e-05, "epoch": 1.028, "percentage": 34.41, "elapsed_time": "3:54:32", "remaining_time": "7:27:06"}
{"current_steps": 65, "total_steps": 186, "loss": 0.4082, "lr": 6.593498197522348e-05, "epoch": 1.044, "percentage": 34.95, "elapsed_time": "3:58:10", "remaining_time": "7:23:22"}
{"current_steps": 66, "total_steps": 186, "loss": 0.4055, "lr": 6.535754970757567e-05, "epoch": 1.06, "percentage": 35.48, "elapsed_time": "4:01:47", "remaining_time": "7:19:38"}
{"current_steps": 67, "total_steps": 186, "loss": 0.4079, "lr": 6.477114395204142e-05, "epoch": 1.076, "percentage": 36.02, "elapsed_time": "4:05:25", "remaining_time": "7:15:54"}
{"current_steps": 68, "total_steps": 186, "loss": 0.4013, "lr": 6.417597222492268e-05, "epoch": 1.092, "percentage": 36.56, "elapsed_time": "4:09:02", "remaining_time": "7:12:10"}
{"current_steps": 69, "total_steps": 186, "loss": 0.4065, "lr": 6.35722451446091e-05, "epoch": 1.108, "percentage": 37.1, "elapsed_time": "4:12:40", "remaining_time": "7:08:26"}
{"current_steps": 70, "total_steps": 186, "loss": 0.3964, "lr": 6.296017635704455e-05, "epoch": 1.124, "percentage": 37.63, "elapsed_time": "4:16:17", "remaining_time": "7:04:43"}
{"current_steps": 71, "total_steps": 186, "loss": 0.4053, "lr": 6.233998246012253e-05, "epoch": 1.1400000000000001, "percentage": 38.17, "elapsed_time": "4:19:55", "remaining_time": "7:01:00"}
{"current_steps": 72, "total_steps": 186, "loss": 0.3926, "lr": 6.171188292703685e-05, "epoch": 1.156, "percentage": 38.71, "elapsed_time": "4:23:33", "remaining_time": "6:57:18"}
{"current_steps": 73, "total_steps": 186, "loss": 0.3957, "lr": 6.10761000286148e-05, "epoch": 1.172, "percentage": 39.25, "elapsed_time": "4:27:11", "remaining_time": "6:53:35"}
{"current_steps": 74, "total_steps": 186, "loss": 0.401, "lr": 6.043285875466032e-05, "epoch": 1.188, "percentage": 39.78, "elapsed_time": "4:30:48", "remaining_time": "6:49:52"}
{"current_steps": 75, "total_steps": 186, "loss": 0.4009, "lr": 5.978238673433502e-05, "epoch": 1.204, "percentage": 40.32, "elapsed_time": "4:34:26", "remaining_time": "6:46:09"}
{"current_steps": 76, "total_steps": 186, "loss": 0.3976, "lr": 5.912491415560507e-05, "epoch": 1.22, "percentage": 40.86, "elapsed_time": "4:38:03", "remaining_time": "6:42:27"}
{"current_steps": 77, "total_steps": 186, "loss": 0.3983, "lr": 5.8460673683782756e-05, "epoch": 1.236, "percentage": 41.4, "elapsed_time": "4:41:40", "remaining_time": "6:38:44"}
{"current_steps": 78, "total_steps": 186, "loss": 0.3989, "lr": 5.7789900379191186e-05, "epoch": 1.252, "percentage": 41.94, "elapsed_time": "4:45:18", "remaining_time": "6:35:01"}
{"current_steps": 79, "total_steps": 186, "loss": 0.3995, "lr": 5.7112831613981554e-05, "epoch": 1.268, "percentage": 42.47, "elapsed_time": "4:48:55", "remaining_time": "6:31:19"}
{"current_steps": 80, "total_steps": 186, "loss": 0.3968, "lr": 5.64297069881323e-05, "epoch": 1.284, "percentage": 43.01, "elapsed_time": "4:52:32", "remaining_time": "6:27:36"}
{"current_steps": 81, "total_steps": 186, "loss": 0.3963, "lr": 5.574076824465983e-05, "epoch": 1.3, "percentage": 43.55, "elapsed_time": "4:56:09", "remaining_time": "6:23:55"}
{"current_steps": 82, "total_steps": 186, "loss": 0.3985, "lr": 5.5046259184070894e-05, "epoch": 1.316, "percentage": 44.09, "elapsed_time": "4:59:47", "remaining_time": "6:20:13"}
{"current_steps": 83, "total_steps": 186, "loss": 0.3893, "lr": 5.4346425578086915e-05, "epoch": 1.332, "percentage": 44.62, "elapsed_time": "5:03:24", "remaining_time": "6:16:31"}
{"current_steps": 84, "total_steps": 186, "loss": 0.3927, "lr": 5.364151508267064e-05, "epoch": 1.3479999999999999, "percentage": 45.16, "elapsed_time": "5:07:02", "remaining_time": "6:12:49"}
{"current_steps": 85, "total_steps": 186, "loss": 0.3913, "lr": 5.293177715038608e-05, "epoch": 1.3639999999999999, "percentage": 45.7, "elapsed_time": "5:10:39", "remaining_time": "6:09:08"}
{"current_steps": 86, "total_steps": 186, "loss": 0.3893, "lr": 5.2217462942122664e-05, "epoch": 1.38, "percentage": 46.24, "elapsed_time": "5:14:16", "remaining_time": "6:05:26"}
{"current_steps": 87, "total_steps": 186, "loss": 0.3903, "lr": 5.1498825238214786e-05, "epoch": 1.396, "percentage": 46.77, "elapsed_time": "5:17:54", "remaining_time": "6:01:45"}
{"current_steps": 88, "total_steps": 186, "loss": 0.3974, "lr": 5.077611834898839e-05, "epoch": 1.412, "percentage": 47.31, "elapsed_time": "5:21:32", "remaining_time": "5:58:04"}
{"current_steps": 89, "total_steps": 186, "loss": 0.3912, "lr": 5.004959802476596e-05, "epoch": 1.428, "percentage": 47.85, "elapsed_time": "5:25:09", "remaining_time": "5:54:23"}
{"current_steps": 90, "total_steps": 186, "loss": 0.3898, "lr": 4.931952136536213e-05, "epoch": 1.444, "percentage": 48.39, "elapsed_time": "5:28:47", "remaining_time": "5:50:42"}
{"current_steps": 91, "total_steps": 186, "loss": 0.3902, "lr": 4.858614672910155e-05, "epoch": 1.46, "percentage": 48.92, "elapsed_time": "5:32:24", "remaining_time": "5:47:01"}
{"current_steps": 92, "total_steps": 186, "loss": 0.389, "lr": 4.784973364139144e-05, "epoch": 1.476, "percentage": 49.46, "elapsed_time": "5:36:02", "remaining_time": "5:43:20"}
{"current_steps": 93, "total_steps": 186, "loss": 0.3923, "lr": 4.711054270288125e-05, "epoch": 1.492, "percentage": 50.0, "elapsed_time": "5:39:39", "remaining_time": "5:39:39"}
{"current_steps": 94, "total_steps": 186, "loss": 0.3915, "lr": 4.6368835497241704e-05, "epoch": 1.508, "percentage": 50.54, "elapsed_time": "5:43:17", "remaining_time": "5:35:58"}
{"current_steps": 95, "total_steps": 186, "loss": 0.3868, "lr": 4.562487449859594e-05, "epoch": 1.524, "percentage": 51.08, "elapsed_time": "5:46:54", "remaining_time": "5:32:18"}
{"current_steps": 96, "total_steps": 186, "loss": 0.3901, "lr": 4.4878922978635686e-05, "epoch": 1.54, "percentage": 51.61, "elapsed_time": "5:50:32", "remaining_time": "5:28:37"}
{"current_steps": 97, "total_steps": 186, "loss": 0.3918, "lr": 4.4131244913455064e-05, "epoch": 1.556, "percentage": 52.15, "elapsed_time": "5:54:10", "remaining_time": "5:24:57"}
{"current_steps": 98, "total_steps": 186, "loss": 0.3857, "lr": 4.3382104890135164e-05, "epoch": 1.572, "percentage": 52.69, "elapsed_time": "5:57:47", "remaining_time": "5:21:17"}
{"current_steps": 99, "total_steps": 186, "loss": 0.3872, "lr": 4.263176801311243e-05, "epoch": 1.588, "percentage": 53.23, "elapsed_time": "6:01:25", "remaining_time": "5:17:36"}
{"current_steps": 100, "total_steps": 186, "loss": 0.386, "lr": 4.1880499810363906e-05, "epoch": 1.604, "percentage": 53.76, "elapsed_time": "6:05:02", "remaining_time": "5:13:56"}
{"current_steps": 101, "total_steps": 186, "loss": 0.3858, "lr": 4.112856613944265e-05, "epoch": 1.62, "percentage": 54.3, "elapsed_time": "6:08:40", "remaining_time": "5:10:16"}
{"current_steps": 102, "total_steps": 186, "loss": 0.3867, "lr": 4.03762330933965e-05, "epoch": 1.6360000000000001, "percentage": 54.84, "elapsed_time": "6:12:17", "remaining_time": "5:06:35"}
{"current_steps": 103, "total_steps": 186, "loss": 0.3818, "lr": 3.962376690660352e-05, "epoch": 1.6520000000000001, "percentage": 55.38, "elapsed_time": "6:15:55", "remaining_time": "5:02:55"}
{"current_steps": 104, "total_steps": 186, "loss": 0.3856, "lr": 3.8871433860557365e-05, "epoch": 1.6680000000000001, "percentage": 55.91, "elapsed_time": "6:19:32", "remaining_time": "4:59:15"}
{"current_steps": 105, "total_steps": 186, "loss": 0.389, "lr": 3.811950018963611e-05, "epoch": 1.6840000000000002, "percentage": 56.45, "elapsed_time": "6:23:10", "remaining_time": "4:55:35"}
{"current_steps": 106, "total_steps": 186, "loss": 0.3876, "lr": 3.736823198688758e-05, "epoch": 1.7, "percentage": 56.99, "elapsed_time": "6:26:48", "remaining_time": "4:51:55"}
{"current_steps": 107, "total_steps": 186, "loss": 0.3849, "lr": 3.6617895109864836e-05, "epoch": 1.716, "percentage": 57.53, "elapsed_time": "6:30:26", "remaining_time": "4:48:15"}
{"current_steps": 108, "total_steps": 186, "loss": 0.3881, "lr": 3.586875508654495e-05, "epoch": 1.732, "percentage": 58.06, "elapsed_time": "6:34:03", "remaining_time": "4:44:36"}
{"current_steps": 109, "total_steps": 186, "loss": 0.3882, "lr": 3.512107702136432e-05, "epoch": 1.748, "percentage": 58.6, "elapsed_time": "6:37:41", "remaining_time": "4:40:56"}
{"current_steps": 110, "total_steps": 186, "loss": 0.3796, "lr": 3.437512550140408e-05, "epoch": 1.764, "percentage": 59.14, "elapsed_time": "6:41:19", "remaining_time": "4:37:16"}
{"current_steps": 111, "total_steps": 186, "loss": 0.3807, "lr": 3.363116450275831e-05, "epoch": 1.78, "percentage": 59.68, "elapsed_time": "6:44:57", "remaining_time": "4:33:36"}
{"current_steps": 112, "total_steps": 186, "loss": 0.3898, "lr": 3.2889457297118754e-05, "epoch": 1.796, "percentage": 60.22, "elapsed_time": "6:48:35", "remaining_time": "4:29:57"}
{"current_steps": 113, "total_steps": 186, "loss": 0.3829, "lr": 3.2150266358608566e-05, "epoch": 1.812, "percentage": 60.75, "elapsed_time": "6:52:13", "remaining_time": "4:26:18"}
{"current_steps": 114, "total_steps": 186, "loss": 0.3831, "lr": 3.1413853270898456e-05, "epoch": 1.8279999999999998, "percentage": 61.29, "elapsed_time": "6:55:50", "remaining_time": "4:22:38"}
{"current_steps": 115, "total_steps": 186, "loss": 0.3797, "lr": 3.0680478634637876e-05, "epoch": 1.8439999999999999, "percentage": 61.83, "elapsed_time": "6:59:27", "remaining_time": "4:18:58"}
{"current_steps": 116, "total_steps": 186, "loss": 0.3784, "lr": 2.9950401975234053e-05, "epoch": 1.8599999999999999, "percentage": 62.37, "elapsed_time": "7:03:05", "remaining_time": "4:15:18"}
{"current_steps": 117, "total_steps": 186, "loss": 0.38, "lr": 2.922388165101164e-05, "epoch": 1.876, "percentage": 62.9, "elapsed_time": "7:06:43", "remaining_time": "4:11:39"}
{"current_steps": 118, "total_steps": 186, "loss": 0.383, "lr": 2.8501174761785227e-05, "epoch": 1.892, "percentage": 63.44, "elapsed_time": "7:10:20", "remaining_time": "4:07:59"}
{"current_steps": 119, "total_steps": 186, "loss": 0.3803, "lr": 2.7782537057877353e-05, "epoch": 1.908, "percentage": 63.98, "elapsed_time": "7:13:58", "remaining_time": "4:04:20"}
{"current_steps": 120, "total_steps": 186, "loss": 0.3828, "lr": 2.7068222849613924e-05, "epoch": 1.924, "percentage": 64.52, "elapsed_time": "7:17:35", "remaining_time": "4:00:40"}
{"current_steps": 121, "total_steps": 186, "loss": 0.3807, "lr": 2.635848491732936e-05, "epoch": 1.94, "percentage": 65.05, "elapsed_time": "7:21:13", "remaining_time": "3:57:01"}
{"current_steps": 122, "total_steps": 186, "loss": 0.3762, "lr": 2.56535744219131e-05, "epoch": 1.956, "percentage": 65.59, "elapsed_time": "7:24:51", "remaining_time": "3:53:21"}
{"current_steps": 123, "total_steps": 186, "loss": 0.3779, "lr": 2.4953740815929112e-05, "epoch": 1.972, "percentage": 66.13, "elapsed_time": "7:28:32", "remaining_time": "3:49:44"}
{"current_steps": 124, "total_steps": 186, "loss": 0.3772, "lr": 2.4259231755340185e-05, "epoch": 1.988, "percentage": 66.67, "elapsed_time": "7:32:13", "remaining_time": "3:46:06"}
{"current_steps": 125, "total_steps": 186, "loss": 0.6469, "lr": 2.3570293011867705e-05, "epoch": 2.008, "percentage": 67.2, "elapsed_time": "7:37:24", "remaining_time": "3:43:12"}
{"current_steps": 126, "total_steps": 186, "loss": 0.3551, "lr": 2.2887168386018446e-05, "epoch": 2.024, "percentage": 67.74, "elapsed_time": "7:41:01", "remaining_time": "3:39:32"}
{"current_steps": 127, "total_steps": 186, "loss": 0.3608, "lr": 2.221009962080883e-05, "epoch": 2.04, "percentage": 68.28, "elapsed_time": "7:44:38", "remaining_time": "3:35:51"}
{"current_steps": 128, "total_steps": 186, "loss": 0.3618, "lr": 2.153932631621725e-05, "epoch": 2.056, "percentage": 68.82, "elapsed_time": "7:48:15", "remaining_time": "3:32:10"}
{"current_steps": 129, "total_steps": 186, "loss": 0.36, "lr": 2.0875085844394933e-05, "epoch": 2.072, "percentage": 69.35, "elapsed_time": "7:51:53", "remaining_time": "3:28:30"}
{"current_steps": 130, "total_steps": 186, "loss": 0.366, "lr": 2.021761326566499e-05, "epoch": 2.088, "percentage": 69.89, "elapsed_time": "7:55:30", "remaining_time": "3:24:50"}
{"current_steps": 131, "total_steps": 186, "loss": 0.3577, "lr": 1.9567141245339695e-05, "epoch": 2.104, "percentage": 70.43, "elapsed_time": "7:59:08", "remaining_time": "3:21:09"}
{"current_steps": 132, "total_steps": 186, "loss": 0.3628, "lr": 1.8923899971385215e-05, "epoch": 2.12, "percentage": 70.97, "elapsed_time": "8:02:45", "remaining_time": "3:17:29"}
{"current_steps": 133, "total_steps": 186, "loss": 0.3596, "lr": 1.828811707296315e-05, "epoch": 2.136, "percentage": 71.51, "elapsed_time": "8:06:23", "remaining_time": "3:13:49"}
{"current_steps": 134, "total_steps": 186, "loss": 0.3576, "lr": 1.766001753987748e-05, "epoch": 2.152, "percentage": 72.04, "elapsed_time": "8:10:00", "remaining_time": "3:10:09"}
{"current_steps": 135, "total_steps": 186, "loss": 0.3625, "lr": 1.7039823642955458e-05, "epoch": 2.168, "percentage": 72.58, "elapsed_time": "8:13:38", "remaining_time": "3:06:29"}
{"current_steps": 136, "total_steps": 186, "loss": 0.3579, "lr": 1.642775485539092e-05, "epoch": 2.184, "percentage": 73.12, "elapsed_time": "8:17:15", "remaining_time": "3:02:49"}
{"current_steps": 137, "total_steps": 186, "loss": 0.3584, "lr": 1.5824027775077322e-05, "epoch": 2.2, "percentage": 73.66, "elapsed_time": "8:20:53", "remaining_time": "2:59:09"}
{"current_steps": 138, "total_steps": 186, "loss": 0.359, "lr": 1.5228856047958603e-05, "epoch": 2.216, "percentage": 74.19, "elapsed_time": "8:24:31", "remaining_time": "2:55:29"}
{"current_steps": 139, "total_steps": 186, "loss": 0.3659, "lr": 1.4642450292424326e-05, "epoch": 2.232, "percentage": 74.73, "elapsed_time": "8:28:08", "remaining_time": "2:51:49"}
{"current_steps": 140, "total_steps": 186, "loss": 0.3572, "lr": 1.4065018024776533e-05, "epoch": 2.248, "percentage": 75.27, "elapsed_time": "8:31:45", "remaining_time": "2:48:09"}
{"current_steps": 141, "total_steps": 186, "loss": 0.365, "lr": 1.3496763585794166e-05, "epoch": 2.2640000000000002, "percentage": 75.81, "elapsed_time": "8:35:23", "remaining_time": "2:44:29"}
{"current_steps": 142, "total_steps": 186, "loss": 0.3513, "lr": 1.2937888068421254e-05, "epoch": 2.2800000000000002, "percentage": 76.34, "elapsed_time": "8:39:01", "remaining_time": "2:40:49"}
{"current_steps": 143, "total_steps": 186, "loss": 0.3515, "lr": 1.238858924660456e-05, "epoch": 2.296, "percentage": 76.88, "elapsed_time": "8:42:38", "remaining_time": "2:37:09"}
{"current_steps": 144, "total_steps": 186, "loss": 0.3576, "lr": 1.184906150530555e-05, "epoch": 2.312, "percentage": 77.42, "elapsed_time": "8:46:16", "remaining_time": "2:33:29"}
{"current_steps": 145, "total_steps": 186, "loss": 0.3611, "lr": 1.1319495771711884e-05, "epoch": 2.328, "percentage": 77.96, "elapsed_time": "8:49:53", "remaining_time": "2:29:49"}
{"current_steps": 146, "total_steps": 186, "loss": 0.3584, "lr": 1.0800079447672318e-05, "epoch": 2.344, "percentage": 78.49, "elapsed_time": "8:53:31", "remaining_time": "2:26:10"}
{"current_steps": 147, "total_steps": 186, "loss": 0.3596, "lr": 1.0290996343379316e-05, "epoch": 2.36, "percentage": 79.03, "elapsed_time": "8:57:08", "remaining_time": "2:22:30"}
{"current_steps": 148, "total_steps": 186, "loss": 0.3631, "lr": 9.79242661232256e-06, "epoch": 2.376, "percentage": 79.57, "elapsed_time": "9:00:45", "remaining_time": "2:18:50"}
{"current_steps": 149, "total_steps": 186, "loss": 0.3597, "lr": 9.304546687536523e-06, "epoch": 2.392, "percentage": 80.11, "elapsed_time": "9:04:23", "remaining_time": "2:15:10"}
{"current_steps": 150, "total_steps": 186, "loss": 0.3593, "lr": 8.827529219164704e-06, "epoch": 2.408, "percentage": 80.65, "elapsed_time": "9:08:00", "remaining_time": "2:11:31"}
{"current_steps": 151, "total_steps": 186, "loss": 0.3578, "lr": 8.361543013362384e-06, "epoch": 2.424, "percentage": 81.18, "elapsed_time": "9:11:38", "remaining_time": "2:07:51"}
{"current_steps": 152, "total_steps": 186, "loss": 0.3564, "lr": 7.90675297255986e-06, "epoch": 2.44, "percentage": 81.72, "elapsed_time": "9:15:15", "remaining_time": "2:04:12"}
{"current_steps": 153, "total_steps": 186, "loss": 0.3555, "lr": 7.463320037107018e-06, "epoch": 2.456, "percentage": 82.26, "elapsed_time": "9:18:51", "remaining_time": "2:00:32"}
{"current_steps": 154, "total_steps": 186, "loss": 0.3618, "lr": 7.031401128320019e-06, "epoch": 2.472, "percentage": 82.8, "elapsed_time": "9:22:29", "remaining_time": "1:56:52"}
{"current_steps": 155, "total_steps": 186, "loss": 0.3623, "lr": 6.61114909295026e-06, "epoch": 2.488, "percentage": 83.33, "elapsed_time": "9:26:07", "remaining_time": "1:53:13"}
{"current_steps": 156, "total_steps": 186, "loss": 0.3576, "lr": 6.202712649095177e-06, "epoch": 2.504, "percentage": 83.87, "elapsed_time": "9:29:44", "remaining_time": "1:49:33"}
{"current_steps": 157, "total_steps": 186, "loss": 0.3618, "lr": 5.806236333570203e-06, "epoch": 2.52, "percentage": 84.41, "elapsed_time": "9:33:21", "remaining_time": "1:45:54"}
{"current_steps": 158, "total_steps": 186, "loss": 0.3573, "lr": 5.421860450760226e-06, "epoch": 2.536, "percentage": 84.95, "elapsed_time": "9:36:58", "remaining_time": "1:42:14"}
{"current_steps": 159, "total_steps": 186, "loss": 0.3555, "lr": 5.04972102296899e-06, "epoch": 2.552, "percentage": 85.48, "elapsed_time": "9:40:35", "remaining_time": "1:38:35"}
{"current_steps": 160, "total_steps": 186, "loss": 0.3596, "lr": 4.6899497422837035e-06, "epoch": 2.568, "percentage": 86.02, "elapsed_time": "9:44:13", "remaining_time": "1:34:56"}
{"current_steps": 161, "total_steps": 186, "loss": 0.3558, "lr": 4.34267392397206e-06, "epoch": 2.584, "percentage": 86.56, "elapsed_time": "9:47:50", "remaining_time": "1:31:16"}
{"current_steps": 162, "total_steps": 186, "loss": 0.3534, "lr": 4.0080164614281395e-06, "epoch": 2.6, "percentage": 87.1, "elapsed_time": "9:51:28", "remaining_time": "1:27:37"}
{"current_steps": 163, "total_steps": 186, "loss": 0.3596, "lr": 3.6860957826830545e-06, "epoch": 2.616, "percentage": 87.63, "elapsed_time": "9:55:05", "remaining_time": "1:23:58"}
{"current_steps": 164, "total_steps": 186, "loss": 0.3552, "lr": 3.377025808495913e-06, "epoch": 2.632, "percentage": 88.17, "elapsed_time": "9:58:44", "remaining_time": "1:20:19"}
{"current_steps": 165, "total_steps": 186, "loss": 0.3581, "lr": 3.080915912039628e-06, "epoch": 2.648, "percentage": 88.71, "elapsed_time": "10:02:21", "remaining_time": "1:16:39"}
{"current_steps": 166, "total_steps": 186, "loss": 0.3547, "lr": 2.797870880196203e-06, "epoch": 2.664, "percentage": 89.25, "elapsed_time": "10:05:59", "remaining_time": "1:13:00"}
{"current_steps": 167, "total_steps": 186, "loss": 0.3601, "lr": 2.527990876474893e-06, "epoch": 2.68, "percentage": 89.78, "elapsed_time": "10:09:36", "remaining_time": "1:09:21"}
{"current_steps": 168, "total_steps": 186, "loss": 0.3545, "lr": 2.271371405566485e-06, "epoch": 2.6959999999999997, "percentage": 90.32, "elapsed_time": "10:13:14", "remaining_time": "1:05:42"}
{"current_steps": 169, "total_steps": 186, "loss": 0.3553, "lr": 2.0281032795462963e-06, "epoch": 2.7119999999999997, "percentage": 90.86, "elapsed_time": "10:16:51", "remaining_time": "1:02:03"}
{"current_steps": 170, "total_steps": 186, "loss": 0.3575, "lr": 1.7982725857377036e-06, "epoch": 2.7279999999999998, "percentage": 91.4, "elapsed_time": "10:20:29", "remaining_time": "0:58:23"}
{"current_steps": 171, "total_steps": 186, "loss": 0.3552, "lr": 1.5819606562477475e-06, "epoch": 2.7439999999999998, "percentage": 91.94, "elapsed_time": "10:24:06", "remaining_time": "0:54:44"}
{"current_steps": 172, "total_steps": 186, "loss": 0.3559, "lr": 1.3792440391854122e-06, "epoch": 2.76, "percentage": 92.47, "elapsed_time": "10:27:44", "remaining_time": "0:51:05"}
{"current_steps": 173, "total_steps": 186, "loss": 0.3593, "lr": 1.190194471572963e-06, "epoch": 2.776, "percentage": 93.01, "elapsed_time": "10:31:21", "remaining_time": "0:47:26"}
{"current_steps": 174, "total_steps": 186, "loss": 0.3621, "lr": 1.0148788539597176e-06, "epoch": 2.792, "percentage": 93.55, "elapsed_time": "10:34:58", "remaining_time": "0:43:47"}
{"current_steps": 175, "total_steps": 186, "loss": 0.3589, "lr": 8.533592267474166e-07, "epoch": 2.808, "percentage": 94.09, "elapsed_time": "10:38:36", "remaining_time": "0:40:08"}
{"current_steps": 176, "total_steps": 186, "loss": 0.3563, "lr": 7.056927482354514e-07, "epoch": 2.824, "percentage": 94.62, "elapsed_time": "10:42:13", "remaining_time": "0:36:29"}
{"current_steps": 177, "total_steps": 186, "loss": 0.3547, "lr": 5.719316743938086e-07, "epoch": 2.84, "percentage": 95.16, "elapsed_time": "10:45:51", "remaining_time": "0:32:50"}
{"current_steps": 178, "total_steps": 186, "loss": 0.3514, "lr": 4.521233403707781e-07, "epoch": 2.856, "percentage": 95.7, "elapsed_time": "10:49:28", "remaining_time": "0:29:11"}
{"current_steps": 179, "total_steps": 186, "loss": 0.3576, "lr": 3.463101437420857e-07, "epoch": 2.872, "percentage": 96.24, "elapsed_time": "10:53:05", "remaining_time": "0:25:32"}
{"current_steps": 180, "total_steps": 186, "loss": 0.3496, "lr": 2.5452952950732136e-07, "epoch": 2.888, "percentage": 96.77, "elapsed_time": "10:56:43", "remaining_time": "0:21:53"}
{"current_steps": 181, "total_steps": 186, "loss": 0.3584, "lr": 1.768139768389343e-07, "epoch": 2.904, "percentage": 97.31, "elapsed_time": "11:00:20", "remaining_time": "0:18:14"}
{"current_steps": 182, "total_steps": 186, "loss": 0.3559, "lr": 1.1319098758858726e-07, "epoch": 2.92, "percentage": 97.85, "elapsed_time": "11:03:58", "remaining_time": "0:14:35"}
{"current_steps": 183, "total_steps": 186, "loss": 0.3566, "lr": 6.368307655482576e-08, "epoch": 2.936, "percentage": 98.39, "elapsed_time": "11:07:36", "remaining_time": "0:10:56"}
{"current_steps": 184, "total_steps": 186, "loss": 0.3628, "lr": 2.830776351558484e-08, "epoch": 2.952, "percentage": 98.92, "elapsed_time": "11:11:13", "remaining_time": "0:07:17"}
{"current_steps": 185, "total_steps": 186, "loss": 0.3557, "lr": 7.077567028335175e-09, "epoch": 2.968, "percentage": 99.46, "elapsed_time": "11:14:51", "remaining_time": "0:03:38"}
{"current_steps": 186, "total_steps": 186, "loss": 0.3594, "lr": 0.0, "epoch": 2.984, "percentage": 100.0, "elapsed_time": "11:18:28", "remaining_time": "0:00:00"}
{"current_steps": 186, "total_steps": 186, "epoch": 2.984, "percentage": 100.0, "elapsed_time": "11:20:02", "remaining_time": "0:00:00"}