openthoughts_30k_32B / trainer_log.jsonl
reinhardh's picture
Training in progress, epoch 4
02a1c20 verified
{"current_steps": 1, "total_steps": 125, "loss": 0.7558, "lr": 6.153846153846155e-06, "epoch": 0.03940886699507389, "percentage": 0.8, "elapsed_time": "0:03:32", "remaining_time": "7:18:37"}
{"current_steps": 2, "total_steps": 125, "loss": 0.7528, "lr": 1.230769230769231e-05, "epoch": 0.07881773399014778, "percentage": 1.6, "elapsed_time": "0:06:41", "remaining_time": "6:52:02"}
{"current_steps": 3, "total_steps": 125, "loss": 0.7189, "lr": 1.8461538461538465e-05, "epoch": 0.11822660098522167, "percentage": 2.4, "elapsed_time": "0:09:52", "remaining_time": "6:41:29"}
{"current_steps": 4, "total_steps": 125, "loss": 0.6998, "lr": 2.461538461538462e-05, "epoch": 0.15763546798029557, "percentage": 3.2, "elapsed_time": "0:13:02", "remaining_time": "6:34:40"}
{"current_steps": 5, "total_steps": 125, "loss": 0.639, "lr": 3.0769230769230774e-05, "epoch": 0.19704433497536947, "percentage": 4.0, "elapsed_time": "0:16:12", "remaining_time": "6:29:11"}
{"current_steps": 6, "total_steps": 125, "loss": 0.6071, "lr": 3.692307692307693e-05, "epoch": 0.23645320197044334, "percentage": 4.8, "elapsed_time": "0:19:23", "remaining_time": "6:24:27"}
{"current_steps": 7, "total_steps": 125, "loss": 0.6034, "lr": 4.307692307692308e-05, "epoch": 0.27586206896551724, "percentage": 5.6, "elapsed_time": "0:22:33", "remaining_time": "6:20:12"}
{"current_steps": 8, "total_steps": 125, "loss": 0.5724, "lr": 4.923076923076924e-05, "epoch": 0.31527093596059114, "percentage": 6.4, "elapsed_time": "0:25:43", "remaining_time": "6:16:11"}
{"current_steps": 9, "total_steps": 125, "loss": 0.5544, "lr": 5.538461538461539e-05, "epoch": 0.35467980295566504, "percentage": 7.2, "elapsed_time": "0:28:53", "remaining_time": "6:12:20"}
{"current_steps": 10, "total_steps": 125, "loss": 0.5503, "lr": 6.153846153846155e-05, "epoch": 0.39408866995073893, "percentage": 8.0, "elapsed_time": "0:32:03", "remaining_time": "6:08:41"}
{"current_steps": 11, "total_steps": 125, "loss": 0.5314, "lr": 6.76923076923077e-05, "epoch": 0.43349753694581283, "percentage": 8.8, "elapsed_time": "0:35:13", "remaining_time": "6:05:03"}
{"current_steps": 12, "total_steps": 125, "loss": 0.5293, "lr": 7.384615384615386e-05, "epoch": 0.4729064039408867, "percentage": 9.6, "elapsed_time": "0:38:23", "remaining_time": "6:01:27"}
{"current_steps": 13, "total_steps": 125, "loss": 0.5197, "lr": 8e-05, "epoch": 0.5123152709359606, "percentage": 10.4, "elapsed_time": "0:41:32", "remaining_time": "5:57:55"}
{"current_steps": 14, "total_steps": 125, "loss": 0.5108, "lr": 7.998426505532213e-05, "epoch": 0.5517241379310345, "percentage": 11.2, "elapsed_time": "0:44:42", "remaining_time": "5:54:29"}
{"current_steps": 15, "total_steps": 125, "loss": 0.5039, "lr": 7.993707260071268e-05, "epoch": 0.5911330049261084, "percentage": 12.0, "elapsed_time": "0:47:52", "remaining_time": "5:51:06"}
{"current_steps": 16, "total_steps": 125, "loss": 0.492, "lr": 7.985845976470478e-05, "epoch": 0.6305418719211823, "percentage": 12.8, "elapsed_time": "0:51:02", "remaining_time": "5:47:43"}
{"current_steps": 17, "total_steps": 125, "loss": 0.4894, "lr": 7.974848839572971e-05, "epoch": 0.6699507389162561, "percentage": 13.6, "elapsed_time": "0:54:12", "remaining_time": "5:44:20"}
{"current_steps": 18, "total_steps": 125, "loss": 0.478, "lr": 7.960724501345783e-05, "epoch": 0.7093596059113301, "percentage": 14.4, "elapsed_time": "0:57:21", "remaining_time": "5:40:58"}
{"current_steps": 19, "total_steps": 125, "loss": 0.4758, "lr": 7.943484074072943e-05, "epoch": 0.7487684729064039, "percentage": 15.2, "elapsed_time": "1:00:32", "remaining_time": "5:37:45"}
{"current_steps": 20, "total_steps": 125, "loss": 0.4755, "lr": 7.923141121612922e-05, "epoch": 0.7881773399014779, "percentage": 16.0, "elapsed_time": "1:03:43", "remaining_time": "5:34:32"}
{"current_steps": 21, "total_steps": 125, "loss": 0.4669, "lr": 7.899711648727294e-05, "epoch": 0.8275862068965517, "percentage": 16.8, "elapsed_time": "1:06:53", "remaining_time": "5:31:18"}
{"current_steps": 22, "total_steps": 125, "loss": 0.4634, "lr": 7.873214088489047e-05, "epoch": 0.8669950738916257, "percentage": 17.6, "elapsed_time": "1:10:03", "remaining_time": "5:28:00"}
{"current_steps": 23, "total_steps": 125, "loss": 0.4539, "lr": 7.843669287780399e-05, "epoch": 0.9064039408866995, "percentage": 18.4, "elapsed_time": "1:13:13", "remaining_time": "5:24:43"}
{"current_steps": 24, "total_steps": 125, "loss": 0.4545, "lr": 7.811100490891586e-05, "epoch": 0.9458128078817734, "percentage": 19.2, "elapsed_time": "1:16:23", "remaining_time": "5:21:27"}
{"current_steps": 25, "total_steps": 125, "loss": 0.4472, "lr": 7.775533321233471e-05, "epoch": 0.9852216748768473, "percentage": 20.0, "elapsed_time": "1:19:32", "remaining_time": "5:18:11"}
{"current_steps": 26, "total_steps": 125, "loss": 0.4415, "lr": 7.736995761178399e-05, "epoch": 1.0344827586206897, "percentage": 20.8, "elapsed_time": "1:27:53", "remaining_time": "5:34:40"}
{"current_steps": 27, "total_steps": 125, "loss": 0.4339, "lr": 7.695518130045147e-05, "epoch": 1.0738916256157636, "percentage": 21.6, "elapsed_time": "1:31:03", "remaining_time": "5:30:29"}
{"current_steps": 28, "total_steps": 125, "loss": 0.4334, "lr": 7.651133060245276e-05, "epoch": 1.1133004926108374, "percentage": 22.4, "elapsed_time": "1:34:12", "remaining_time": "5:26:23"}
{"current_steps": 29, "total_steps": 125, "loss": 0.4306, "lr": 7.603875471609677e-05, "epoch": 1.1527093596059113, "percentage": 23.2, "elapsed_time": "1:37:23", "remaining_time": "5:22:22"}
{"current_steps": 30, "total_steps": 125, "loss": 0.4303, "lr": 7.55378254391549e-05, "epoch": 1.1921182266009853, "percentage": 24.0, "elapsed_time": "1:40:33", "remaining_time": "5:18:24"}
{"current_steps": 31, "total_steps": 125, "loss": 0.4187, "lr": 7.500893687635015e-05, "epoch": 1.2315270935960592, "percentage": 24.8, "elapsed_time": "1:43:42", "remaining_time": "5:14:28"}
{"current_steps": 32, "total_steps": 125, "loss": 0.4163, "lr": 7.445250512929637e-05, "epoch": 1.270935960591133, "percentage": 25.6, "elapsed_time": "1:46:52", "remaining_time": "5:10:36"}
{"current_steps": 33, "total_steps": 125, "loss": 0.4112, "lr": 7.386896796913137e-05, "epoch": 1.3103448275862069, "percentage": 26.4, "elapsed_time": "1:50:02", "remaining_time": "5:06:46"}
{"current_steps": 34, "total_steps": 125, "loss": 0.4167, "lr": 7.325878449210182e-05, "epoch": 1.3497536945812807, "percentage": 27.2, "elapsed_time": "1:53:12", "remaining_time": "5:02:59"}
{"current_steps": 35, "total_steps": 125, "loss": 0.4109, "lr": 7.262243475837041e-05, "epoch": 1.3891625615763548, "percentage": 28.0, "elapsed_time": "1:56:22", "remaining_time": "4:59:14"}
{"current_steps": 36, "total_steps": 125, "loss": 0.4124, "lr": 7.196041941432998e-05, "epoch": 1.4285714285714286, "percentage": 28.8, "elapsed_time": "1:59:32", "remaining_time": "4:55:32"}
{"current_steps": 37, "total_steps": 125, "loss": 0.4056, "lr": 7.12732592987212e-05, "epoch": 1.4679802955665024, "percentage": 29.6, "elapsed_time": "2:02:42", "remaining_time": "4:51:50"}
{"current_steps": 38, "total_steps": 125, "loss": 0.4087, "lr": 7.05614950328643e-05, "epoch": 1.5073891625615765, "percentage": 30.4, "elapsed_time": "2:06:03", "remaining_time": "4:48:35"}
{"current_steps": 39, "total_steps": 125, "loss": 0.412, "lr": 6.982568659532663e-05, "epoch": 1.5467980295566504, "percentage": 31.2, "elapsed_time": "2:09:19", "remaining_time": "4:45:10"}
{"current_steps": 40, "total_steps": 125, "loss": 0.4077, "lr": 6.906641288136109e-05, "epoch": 1.5862068965517242, "percentage": 32.0, "elapsed_time": "2:12:29", "remaining_time": "4:41:32"}
{"current_steps": 41, "total_steps": 125, "loss": 0.4135, "lr": 6.828427124746191e-05, "epoch": 1.625615763546798, "percentage": 32.8, "elapsed_time": "2:15:39", "remaining_time": "4:37:56"}
{"current_steps": 42, "total_steps": 125, "loss": 0.408, "lr": 6.747987704139607e-05, "epoch": 1.6650246305418719, "percentage": 33.6, "elapsed_time": "2:18:49", "remaining_time": "4:34:20"}
{"current_steps": 43, "total_steps": 125, "loss": 0.4125, "lr": 6.665386311808017e-05, "epoch": 1.7044334975369457, "percentage": 34.4, "elapsed_time": "2:21:59", "remaining_time": "4:30:46"}
{"current_steps": 44, "total_steps": 125, "loss": 0.4028, "lr": 6.580687934168352e-05, "epoch": 1.7438423645320196, "percentage": 35.2, "elapsed_time": "2:25:09", "remaining_time": "4:27:13"}
{"current_steps": 45, "total_steps": 125, "loss": 0.403, "lr": 6.493959207434934e-05, "epoch": 1.7832512315270936, "percentage": 36.0, "elapsed_time": "2:28:19", "remaining_time": "4:23:41"}
{"current_steps": 46, "total_steps": 125, "loss": 0.4143, "lr": 6.405268365193624e-05, "epoch": 1.8226600985221675, "percentage": 36.8, "elapsed_time": "2:31:29", "remaining_time": "4:20:09"}
{"current_steps": 47, "total_steps": 125, "loss": 0.3986, "lr": 6.314685184719224e-05, "epoch": 1.8620689655172413, "percentage": 37.6, "elapsed_time": "2:34:38", "remaining_time": "4:16:38"}
{"current_steps": 48, "total_steps": 125, "loss": 0.4034, "lr": 6.22228093207841e-05, "epoch": 1.9014778325123154, "percentage": 38.4, "elapsed_time": "2:37:48", "remaining_time": "4:13:08"}
{"current_steps": 49, "total_steps": 125, "loss": 0.398, "lr": 6.128128306061347e-05, "epoch": 1.9408866995073892, "percentage": 39.2, "elapsed_time": "2:40:58", "remaining_time": "4:09:40"}
{"current_steps": 50, "total_steps": 125, "loss": 0.3946, "lr": 6.0323013809861185e-05, "epoch": 1.980295566502463, "percentage": 40.0, "elapsed_time": "2:44:08", "remaining_time": "4:06:12"}
{"current_steps": 51, "total_steps": 125, "loss": 0.3927, "lr": 5.9348755484209597e-05, "epoch": 2.0295566502463056, "percentage": 40.8, "elapsed_time": "2:50:20", "remaining_time": "4:07:09"}
{"current_steps": 52, "total_steps": 125, "loss": 0.3811, "lr": 5.835927457870151e-05, "epoch": 2.0689655172413794, "percentage": 41.6, "elapsed_time": "2:53:29", "remaining_time": "4:03:33"}
{"current_steps": 53, "total_steps": 125, "loss": 0.3757, "lr": 5.735534956470233e-05, "epoch": 2.1083743842364533, "percentage": 42.4, "elapsed_time": "2:56:39", "remaining_time": "3:59:59"}
{"current_steps": 54, "total_steps": 125, "loss": 0.3818, "lr": 5.6337770277439854e-05, "epoch": 2.147783251231527, "percentage": 43.2, "elapsed_time": "2:59:49", "remaining_time": "3:56:26"}
{"current_steps": 55, "total_steps": 125, "loss": 0.3758, "lr": 5.5307337294603595e-05, "epoch": 2.187192118226601, "percentage": 44.0, "elapsed_time": "3:03:00", "remaining_time": "3:52:55"}
{"current_steps": 56, "total_steps": 125, "loss": 0.3667, "lr": 5.4264861306492525e-05, "epoch": 2.226600985221675, "percentage": 44.8, "elapsed_time": "3:06:10", "remaining_time": "3:49:24"}
{"current_steps": 57, "total_steps": 125, "loss": 0.3711, "lr": 5.321116247820669e-05, "epoch": 2.2660098522167487, "percentage": 45.6, "elapsed_time": "3:09:20", "remaining_time": "3:45:52"}
{"current_steps": 58, "total_steps": 125, "loss": 0.367, "lr": 5.214706980438459e-05, "epoch": 2.3054187192118225, "percentage": 46.4, "elapsed_time": "3:12:33", "remaining_time": "3:42:26"}
{"current_steps": 59, "total_steps": 125, "loss": 0.3651, "lr": 5.107342045699397e-05, "epoch": 2.344827586206897, "percentage": 47.2, "elapsed_time": "3:15:45", "remaining_time": "3:38:58"}
{"current_steps": 60, "total_steps": 125, "loss": 0.3723, "lr": 4.999105912668908e-05, "epoch": 2.3842364532019706, "percentage": 48.0, "elapsed_time": "3:18:55", "remaining_time": "3:35:29"}
{"current_steps": 61, "total_steps": 125, "loss": 0.3696, "lr": 4.890083735825258e-05, "epoch": 2.4236453201970445, "percentage": 48.8, "elapsed_time": "3:22:05", "remaining_time": "3:32:01"}
{"current_steps": 62, "total_steps": 125, "loss": 0.3676, "lr": 4.780361288064514e-05, "epoch": 2.4630541871921183, "percentage": 49.6, "elapsed_time": "3:25:14", "remaining_time": "3:28:33"}
{"current_steps": 63, "total_steps": 125, "loss": 0.3697, "lr": 4.670024893218946e-05, "epoch": 2.502463054187192, "percentage": 50.4, "elapsed_time": "3:28:24", "remaining_time": "3:25:06"}
{"current_steps": 64, "total_steps": 125, "loss": 0.3576, "lr": 4.5591613581419984e-05, "epoch": 2.541871921182266, "percentage": 51.2, "elapsed_time": "3:31:34", "remaining_time": "3:21:39"}
{"current_steps": 65, "total_steps": 125, "loss": 0.3667, "lr": 4.4478579044132314e-05, "epoch": 2.58128078817734, "percentage": 52.0, "elapsed_time": "3:34:44", "remaining_time": "3:18:13"}
{"current_steps": 66, "total_steps": 125, "loss": 0.3658, "lr": 4.336202099716991e-05, "epoch": 2.6206896551724137, "percentage": 52.8, "elapsed_time": "3:37:53", "remaining_time": "3:14:47"}
{"current_steps": 67, "total_steps": 125, "loss": 0.3648, "lr": 4.2242817889487676e-05, "epoch": 2.6600985221674875, "percentage": 53.6, "elapsed_time": "3:41:03", "remaining_time": "3:11:22"}
{"current_steps": 68, "total_steps": 125, "loss": 0.3615, "lr": 4.112185025103476e-05, "epoch": 2.6995073891625614, "percentage": 54.4, "elapsed_time": "3:44:14", "remaining_time": "3:07:57"}
{"current_steps": 69, "total_steps": 125, "loss": 0.3663, "lr": 4e-05, "epoch": 2.7389162561576352, "percentage": 55.2, "elapsed_time": "3:47:27", "remaining_time": "3:04:36"}
{"current_steps": 70, "total_steps": 125, "loss": 0.3606, "lr": 3.8878149748965245e-05, "epoch": 2.7783251231527095, "percentage": 56.0, "elapsed_time": "3:50:37", "remaining_time": "3:01:12"}
{"current_steps": 71, "total_steps": 125, "loss": 0.3667, "lr": 3.775718211051233e-05, "epoch": 2.8177339901477834, "percentage": 56.8, "elapsed_time": "3:53:47", "remaining_time": "2:57:48"}
{"current_steps": 72, "total_steps": 125, "loss": 0.3691, "lr": 3.6637979002830106e-05, "epoch": 2.857142857142857, "percentage": 57.6, "elapsed_time": "3:56:57", "remaining_time": "2:54:25"}
{"current_steps": 73, "total_steps": 125, "loss": 0.3664, "lr": 3.552142095586769e-05, "epoch": 2.896551724137931, "percentage": 58.4, "elapsed_time": "4:00:07", "remaining_time": "2:51:03"}
{"current_steps": 74, "total_steps": 125, "loss": 0.3717, "lr": 3.4408386418580036e-05, "epoch": 2.935960591133005, "percentage": 59.2, "elapsed_time": "4:03:18", "remaining_time": "2:47:40"}
{"current_steps": 75, "total_steps": 125, "loss": 0.358, "lr": 3.329975106781055e-05, "epoch": 2.9753694581280787, "percentage": 60.0, "elapsed_time": "4:06:28", "remaining_time": "2:44:18"}
{"current_steps": 76, "total_steps": 125, "loss": 0.3487, "lr": 3.219638711935488e-05, "epoch": 3.0246305418719213, "percentage": 60.8, "elapsed_time": "4:12:41", "remaining_time": "2:42:54"}
{"current_steps": 77, "total_steps": 125, "loss": 0.3378, "lr": 3.109916264174743e-05, "epoch": 3.064039408866995, "percentage": 61.6, "elapsed_time": "4:15:50", "remaining_time": "2:39:29"}
{"current_steps": 78, "total_steps": 125, "loss": 0.3471, "lr": 3.000894087331092e-05, "epoch": 3.103448275862069, "percentage": 62.4, "elapsed_time": "4:19:03", "remaining_time": "2:36:06"}
{"current_steps": 79, "total_steps": 125, "loss": 0.345, "lr": 2.892657954300603e-05, "epoch": 3.142857142857143, "percentage": 63.2, "elapsed_time": "4:22:17", "remaining_time": "2:32:43"}
{"current_steps": 80, "total_steps": 125, "loss": 0.3423, "lr": 2.7852930195615413e-05, "epoch": 3.1822660098522166, "percentage": 64.0, "elapsed_time": "4:25:28", "remaining_time": "2:29:19"}
{"current_steps": 81, "total_steps": 125, "loss": 0.3375, "lr": 2.678883752179333e-05, "epoch": 3.2216748768472905, "percentage": 64.8, "elapsed_time": "4:28:38", "remaining_time": "2:25:55"}
{"current_steps": 82, "total_steps": 125, "loss": 0.3449, "lr": 2.573513869350748e-05, "epoch": 3.2610837438423648, "percentage": 65.6, "elapsed_time": "4:31:49", "remaining_time": "2:22:32"}
{"current_steps": 83, "total_steps": 125, "loss": 0.3477, "lr": 2.4692662705396412e-05, "epoch": 3.3004926108374386, "percentage": 66.4, "elapsed_time": "4:34:59", "remaining_time": "2:19:09"}
{"current_steps": 84, "total_steps": 125, "loss": 0.3393, "lr": 2.366222972256016e-05, "epoch": 3.3399014778325125, "percentage": 67.2, "elapsed_time": "4:38:13", "remaining_time": "2:15:47"}
{"current_steps": 85, "total_steps": 125, "loss": 0.3386, "lr": 2.264465043529768e-05, "epoch": 3.3793103448275863, "percentage": 68.0, "elapsed_time": "4:41:23", "remaining_time": "2:12:25"}
{"current_steps": 86, "total_steps": 125, "loss": 0.3413, "lr": 2.1640725421298487e-05, "epoch": 3.41871921182266, "percentage": 68.8, "elapsed_time": "4:44:33", "remaining_time": "2:09:02"}
{"current_steps": 87, "total_steps": 125, "loss": 0.3415, "lr": 2.065124451579041e-05, "epoch": 3.458128078817734, "percentage": 69.6, "elapsed_time": "4:47:43", "remaining_time": "2:05:40"}
{"current_steps": 88, "total_steps": 125, "loss": 0.3424, "lr": 1.9676986190138835e-05, "epoch": 3.497536945812808, "percentage": 70.4, "elapsed_time": "4:50:53", "remaining_time": "2:02:18"}
{"current_steps": 89, "total_steps": 125, "loss": 0.3438, "lr": 1.8718716939386543e-05, "epoch": 3.5369458128078817, "percentage": 71.2, "elapsed_time": "4:54:04", "remaining_time": "1:58:57"}
{"current_steps": 90, "total_steps": 125, "loss": 0.3413, "lr": 1.7777190679215923e-05, "epoch": 3.5763546798029555, "percentage": 72.0, "elapsed_time": "4:57:14", "remaining_time": "1:55:35"}
{"current_steps": 91, "total_steps": 125, "loss": 0.3394, "lr": 1.6853148152807774e-05, "epoch": 3.6157635467980294, "percentage": 72.8, "elapsed_time": "5:00:24", "remaining_time": "1:52:14"}
{"current_steps": 92, "total_steps": 125, "loss": 0.3452, "lr": 1.5947316348063764e-05, "epoch": 3.655172413793103, "percentage": 73.6, "elapsed_time": "5:03:39", "remaining_time": "1:48:55"}
{"current_steps": 93, "total_steps": 125, "loss": 0.3386, "lr": 1.5060407925650662e-05, "epoch": 3.6945812807881775, "percentage": 74.4, "elapsed_time": "5:06:48", "remaining_time": "1:45:34"}
{"current_steps": 94, "total_steps": 125, "loss": 0.3384, "lr": 1.4193120658316506e-05, "epoch": 3.7339901477832513, "percentage": 75.2, "elapsed_time": "5:09:59", "remaining_time": "1:42:13"}
{"current_steps": 95, "total_steps": 125, "loss": 0.3423, "lr": 1.3346136881919845e-05, "epoch": 3.773399014778325, "percentage": 76.0, "elapsed_time": "5:13:09", "remaining_time": "1:38:53"}
{"current_steps": 96, "total_steps": 125, "loss": 0.3394, "lr": 1.2520122958603933e-05, "epoch": 3.812807881773399, "percentage": 76.8, "elapsed_time": "5:16:19", "remaining_time": "1:35:33"}
{"current_steps": 97, "total_steps": 125, "loss": 0.3377, "lr": 1.1715728752538103e-05, "epoch": 3.852216748768473, "percentage": 77.6, "elapsed_time": "5:19:29", "remaining_time": "1:32:13"}
{"current_steps": 98, "total_steps": 125, "loss": 0.3389, "lr": 1.0933587118638927e-05, "epoch": 3.8916256157635467, "percentage": 78.4, "elapsed_time": "5:22:45", "remaining_time": "1:28:55"}
{"current_steps": 99, "total_steps": 125, "loss": 0.3386, "lr": 1.0174313404673378e-05, "epoch": 3.9310344827586206, "percentage": 79.2, "elapsed_time": "5:25:59", "remaining_time": "1:25:36"}
{"current_steps": 100, "total_steps": 125, "loss": 0.3435, "lr": 9.438504967135703e-06, "epoch": 3.970443349753695, "percentage": 80.0, "elapsed_time": "5:29:09", "remaining_time": "1:22:17"}
{"current_steps": 101, "total_steps": 125, "loss": 0.3299, "lr": 8.72674070127881e-06, "epoch": 4.019704433497537, "percentage": 80.8, "elapsed_time": "5:35:27", "remaining_time": "1:19:42"}
{"current_steps": 102, "total_steps": 125, "loss": 0.3271, "lr": 8.039580585670047e-06, "epoch": 4.059113300492611, "percentage": 81.6, "elapsed_time": "5:38:37", "remaining_time": "1:16:21"}
{"current_steps": 103, "total_steps": 125, "loss": 0.3298, "lr": 7.3775652416295936e-06, "epoch": 4.098522167487685, "percentage": 82.4, "elapsed_time": "5:41:46", "remaining_time": "1:13:00"}
{"current_steps": 104, "total_steps": 125, "loss": 0.3295, "lr": 6.7412155078981865e-06, "epoch": 4.137931034482759, "percentage": 83.2, "elapsed_time": "5:45:00", "remaining_time": "1:09:39"}
{"current_steps": 105, "total_steps": 125, "loss": 0.3274, "lr": 6.1310320308686354e-06, "epoch": 4.177339901477833, "percentage": 84.0, "elapsed_time": "5:48:11", "remaining_time": "1:06:19"}
{"current_steps": 106, "total_steps": 125, "loss": 0.3307, "lr": 5.547494870703642e-06, "epoch": 4.216748768472907, "percentage": 84.8, "elapsed_time": "5:51:21", "remaining_time": "1:02:58"}
{"current_steps": 107, "total_steps": 125, "loss": 0.326, "lr": 4.991063123649853e-06, "epoch": 4.25615763546798, "percentage": 85.6, "elapsed_time": "5:54:31", "remaining_time": "0:59:38"}
{"current_steps": 108, "total_steps": 125, "loss": 0.3273, "lr": 4.462174560845114e-06, "epoch": 4.295566502463054, "percentage": 86.4, "elapsed_time": "5:57:42", "remaining_time": "0:56:18"}
{"current_steps": 109, "total_steps": 125, "loss": 0.3304, "lr": 3.961245283903239e-06, "epoch": 4.334975369458128, "percentage": 87.2, "elapsed_time": "6:00:52", "remaining_time": "0:52:58"}
{"current_steps": 110, "total_steps": 125, "loss": 0.3285, "lr": 3.4886693975472443e-06, "epoch": 4.374384236453202, "percentage": 88.0, "elapsed_time": "6:04:03", "remaining_time": "0:49:38"}
{"current_steps": 111, "total_steps": 125, "loss": 0.328, "lr": 3.0448186995485307e-06, "epoch": 4.413793103448276, "percentage": 88.8, "elapsed_time": "6:07:13", "remaining_time": "0:46:19"}
{"current_steps": 112, "total_steps": 125, "loss": 0.3314, "lr": 2.630042388216012e-06, "epoch": 4.45320197044335, "percentage": 89.6, "elapsed_time": "6:10:23", "remaining_time": "0:42:59"}
{"current_steps": 113, "total_steps": 125, "loss": 0.3285, "lr": 2.244666787665297e-06, "epoch": 4.4926108374384235, "percentage": 90.4, "elapsed_time": "6:13:33", "remaining_time": "0:39:40"}
{"current_steps": 114, "total_steps": 125, "loss": 0.3267, "lr": 1.888995091084147e-06, "epoch": 4.532019704433497, "percentage": 91.2, "elapsed_time": "6:16:45", "remaining_time": "0:36:21"}
{"current_steps": 115, "total_steps": 125, "loss": 0.3199, "lr": 1.5633071221960205e-06, "epoch": 4.571428571428571, "percentage": 92.0, "elapsed_time": "6:19:55", "remaining_time": "0:33:02"}
{"current_steps": 116, "total_steps": 125, "loss": 0.3291, "lr": 1.2678591151095466e-06, "epoch": 4.610837438423645, "percentage": 92.8, "elapsed_time": "6:23:05", "remaining_time": "0:29:43"}
{"current_steps": 117, "total_steps": 125, "loss": 0.328, "lr": 1.0028835127270553e-06, "epoch": 4.650246305418719, "percentage": 93.6, "elapsed_time": "6:26:14", "remaining_time": "0:26:24"}
{"current_steps": 118, "total_steps": 125, "loss": 0.3282, "lr": 7.685887838707828e-07, "epoch": 4.689655172413794, "percentage": 94.4, "elapsed_time": "6:29:25", "remaining_time": "0:23:06"}
{"current_steps": 119, "total_steps": 125, "loss": 0.3358, "lr": 5.651592592705646e-07, "epoch": 4.7290640394088665, "percentage": 95.2, "elapsed_time": "6:32:35", "remaining_time": "0:19:47"}
{"current_steps": 120, "total_steps": 125, "loss": 0.3231, "lr": 3.9275498654217425e-07, "epoch": 4.768472906403941, "percentage": 96.0, "elapsed_time": "6:35:48", "remaining_time": "0:16:29"}
{"current_steps": 121, "total_steps": 125, "loss": 0.3273, "lr": 2.5151160427029584e-07, "epoch": 4.807881773399015, "percentage": 96.8, "elapsed_time": "6:38:58", "remaining_time": "0:13:11"}
{"current_steps": 122, "total_steps": 125, "loss": 0.3252, "lr": 1.4154023529523663e-07, "epoch": 4.847290640394089, "percentage": 97.6, "elapsed_time": "6:42:08", "remaining_time": "0:09:53"}
{"current_steps": 123, "total_steps": 125, "loss": 0.3251, "lr": 6.292739928733582e-08, "epoch": 4.886699507389163, "percentage": 98.4, "elapsed_time": "6:45:19", "remaining_time": "0:06:35"}
{"current_steps": 124, "total_steps": 125, "loss": 0.3261, "lr": 1.5734944677885388e-08, "epoch": 4.926108374384237, "percentage": 99.2, "elapsed_time": "6:48:29", "remaining_time": "0:03:17"}
{"current_steps": 125, "total_steps": 125, "loss": 0.3278, "lr": 0.0, "epoch": 4.9655172413793105, "percentage": 100.0, "elapsed_time": "6:51:39", "remaining_time": "0:00:00"}
{"current_steps": 125, "total_steps": 125, "epoch": 4.9655172413793105, "percentage": 100.0, "elapsed_time": "6:56:37", "remaining_time": "0:00:00"}