new111 / trainer_log.jsonl
zhang9302002's picture
Upload folder using huggingface_hub
11c3233 verified
{"current_steps": 1, "total_steps": 980, "loss": 2.7414, "lr": 0.0, "epoch": 0.03571428571428571, "percentage": 0.1, "elapsed_time": "0:00:03", "remaining_time": "1:03:21"}
{"current_steps": 2, "total_steps": 980, "loss": 2.532, "lr": 1.0204081632653061e-07, "epoch": 0.07142857142857142, "percentage": 0.2, "elapsed_time": "0:00:07", "remaining_time": "1:02:25"}
{"current_steps": 3, "total_steps": 980, "loss": 2.439, "lr": 2.0408163265306121e-07, "epoch": 0.10714285714285714, "percentage": 0.31, "elapsed_time": "0:00:11", "remaining_time": "1:02:06"}
{"current_steps": 4, "total_steps": 980, "loss": 2.5109, "lr": 3.0612244897959183e-07, "epoch": 0.14285714285714285, "percentage": 0.41, "elapsed_time": "0:00:15", "remaining_time": "1:03:36"}
{"current_steps": 5, "total_steps": 980, "loss": 2.5067, "lr": 4.0816326530612243e-07, "epoch": 0.17857142857142858, "percentage": 0.51, "elapsed_time": "0:00:19", "remaining_time": "1:04:29"}
{"current_steps": 6, "total_steps": 980, "loss": 2.6609, "lr": 5.102040816326531e-07, "epoch": 0.21428571428571427, "percentage": 0.61, "elapsed_time": "0:00:23", "remaining_time": "1:02:41"}
{"current_steps": 7, "total_steps": 980, "loss": 2.5307, "lr": 6.122448979591837e-07, "epoch": 0.25, "percentage": 0.71, "elapsed_time": "0:00:27", "remaining_time": "1:03:24"}
{"current_steps": 8, "total_steps": 980, "loss": 2.6476, "lr": 7.142857142857143e-07, "epoch": 0.2857142857142857, "percentage": 0.82, "elapsed_time": "0:00:31", "remaining_time": "1:03:55"}
{"current_steps": 9, "total_steps": 980, "loss": 2.5897, "lr": 8.163265306122449e-07, "epoch": 0.32142857142857145, "percentage": 0.92, "elapsed_time": "0:00:35", "remaining_time": "1:04:16"}
{"current_steps": 10, "total_steps": 980, "loss": 2.5036, "lr": 9.183673469387756e-07, "epoch": 0.35714285714285715, "percentage": 1.02, "elapsed_time": "0:00:39", "remaining_time": "1:04:07"}
{"current_steps": 11, "total_steps": 980, "loss": 2.3625, "lr": 1.0204081632653063e-06, "epoch": 0.39285714285714285, "percentage": 1.12, "elapsed_time": "0:00:42", "remaining_time": "1:03:05"}
{"current_steps": 12, "total_steps": 980, "loss": 2.3566, "lr": 1.122448979591837e-06, "epoch": 0.42857142857142855, "percentage": 1.22, "elapsed_time": "0:00:46", "remaining_time": "1:02:24"}
{"current_steps": 13, "total_steps": 980, "loss": 2.3067, "lr": 1.2244897959183673e-06, "epoch": 0.4642857142857143, "percentage": 1.33, "elapsed_time": "0:00:50", "remaining_time": "1:02:29"}
{"current_steps": 14, "total_steps": 980, "loss": 2.4596, "lr": 1.3265306122448982e-06, "epoch": 0.5, "percentage": 1.43, "elapsed_time": "0:00:53", "remaining_time": "1:02:04"}
{"current_steps": 15, "total_steps": 980, "loss": 2.4559, "lr": 1.4285714285714286e-06, "epoch": 0.5357142857142857, "percentage": 1.53, "elapsed_time": "0:00:58", "remaining_time": "1:02:21"}
{"current_steps": 16, "total_steps": 980, "loss": 2.2781, "lr": 1.5306122448979593e-06, "epoch": 0.5714285714285714, "percentage": 1.63, "elapsed_time": "0:01:03", "remaining_time": "1:03:26"}
{"current_steps": 17, "total_steps": 980, "loss": 2.3636, "lr": 1.6326530612244897e-06, "epoch": 0.6071428571428571, "percentage": 1.73, "elapsed_time": "0:01:06", "remaining_time": "1:02:42"}
{"current_steps": 18, "total_steps": 980, "loss": 2.4038, "lr": 1.7346938775510206e-06, "epoch": 0.6428571428571429, "percentage": 1.84, "elapsed_time": "0:01:09", "remaining_time": "1:02:06"}
{"current_steps": 19, "total_steps": 980, "loss": 2.2931, "lr": 1.8367346938775512e-06, "epoch": 0.6785714285714286, "percentage": 1.94, "elapsed_time": "0:01:13", "remaining_time": "1:01:57"}
{"current_steps": 20, "total_steps": 980, "loss": 2.0346, "lr": 1.938775510204082e-06, "epoch": 0.7142857142857143, "percentage": 2.04, "elapsed_time": "0:01:17", "remaining_time": "1:01:49"}
{"current_steps": 21, "total_steps": 980, "loss": 2.2192, "lr": 2.0408163265306125e-06, "epoch": 0.75, "percentage": 2.14, "elapsed_time": "0:01:21", "remaining_time": "1:02:00"}
{"current_steps": 22, "total_steps": 980, "loss": 2.1561, "lr": 2.1428571428571427e-06, "epoch": 0.7857142857142857, "percentage": 2.24, "elapsed_time": "0:01:24", "remaining_time": "1:01:32"}
{"current_steps": 23, "total_steps": 980, "loss": 2.2667, "lr": 2.244897959183674e-06, "epoch": 0.8214285714285714, "percentage": 2.35, "elapsed_time": "0:01:28", "remaining_time": "1:01:04"}
{"current_steps": 24, "total_steps": 980, "loss": 2.0838, "lr": 2.3469387755102044e-06, "epoch": 0.8571428571428571, "percentage": 2.45, "elapsed_time": "0:01:31", "remaining_time": "1:00:43"}
{"current_steps": 25, "total_steps": 980, "loss": 2.102, "lr": 2.4489795918367347e-06, "epoch": 0.8928571428571429, "percentage": 2.55, "elapsed_time": "0:01:34", "remaining_time": "1:00:21"}
{"current_steps": 26, "total_steps": 980, "loss": 2.0475, "lr": 2.5510204081632657e-06, "epoch": 0.9285714285714286, "percentage": 2.65, "elapsed_time": "0:01:37", "remaining_time": "0:59:55"}
{"current_steps": 27, "total_steps": 980, "loss": 2.0281, "lr": 2.6530612244897964e-06, "epoch": 0.9642857142857143, "percentage": 2.76, "elapsed_time": "0:01:41", "remaining_time": "0:59:44"}
{"current_steps": 28, "total_steps": 980, "loss": 2.019, "lr": 2.7551020408163266e-06, "epoch": 1.0, "percentage": 2.86, "elapsed_time": "0:01:45", "remaining_time": "0:59:40"}
{"current_steps": 29, "total_steps": 980, "loss": 1.9081, "lr": 2.8571428571428573e-06, "epoch": 1.0357142857142858, "percentage": 2.96, "elapsed_time": "0:01:49", "remaining_time": "0:59:51"}
{"current_steps": 30, "total_steps": 980, "loss": 1.9358, "lr": 2.959183673469388e-06, "epoch": 1.0714285714285714, "percentage": 3.06, "elapsed_time": "0:01:53", "remaining_time": "1:00:00"}
{"current_steps": 31, "total_steps": 980, "loss": 1.9145, "lr": 3.0612244897959185e-06, "epoch": 1.1071428571428572, "percentage": 3.16, "elapsed_time": "0:01:58", "remaining_time": "1:00:32"}
{"current_steps": 32, "total_steps": 980, "loss": 1.7714, "lr": 3.1632653061224496e-06, "epoch": 1.1428571428571428, "percentage": 3.27, "elapsed_time": "0:02:02", "remaining_time": "1:00:14"}
{"current_steps": 33, "total_steps": 980, "loss": 1.7249, "lr": 3.2653061224489794e-06, "epoch": 1.1785714285714286, "percentage": 3.37, "elapsed_time": "0:02:06", "remaining_time": "1:00:22"}
{"current_steps": 34, "total_steps": 980, "loss": 1.7585, "lr": 3.3673469387755105e-06, "epoch": 1.2142857142857142, "percentage": 3.47, "elapsed_time": "0:02:09", "remaining_time": "1:00:04"}
{"current_steps": 35, "total_steps": 980, "loss": 1.5646, "lr": 3.469387755102041e-06, "epoch": 1.25, "percentage": 3.57, "elapsed_time": "0:02:13", "remaining_time": "1:00:05"}
{"current_steps": 36, "total_steps": 980, "loss": 1.6348, "lr": 3.5714285714285718e-06, "epoch": 1.2857142857142856, "percentage": 3.67, "elapsed_time": "0:02:16", "remaining_time": "0:59:47"}
{"current_steps": 37, "total_steps": 980, "loss": 1.7431, "lr": 3.6734693877551024e-06, "epoch": 1.3214285714285714, "percentage": 3.78, "elapsed_time": "0:02:20", "remaining_time": "0:59:29"}
{"current_steps": 38, "total_steps": 980, "loss": 1.7093, "lr": 3.7755102040816327e-06, "epoch": 1.3571428571428572, "percentage": 3.88, "elapsed_time": "0:02:24", "remaining_time": "0:59:35"}
{"current_steps": 39, "total_steps": 980, "loss": 1.7049, "lr": 3.877551020408164e-06, "epoch": 1.3928571428571428, "percentage": 3.98, "elapsed_time": "0:02:27", "remaining_time": "0:59:18"}
{"current_steps": 40, "total_steps": 980, "loss": 1.6828, "lr": 3.979591836734694e-06, "epoch": 1.4285714285714286, "percentage": 4.08, "elapsed_time": "0:02:30", "remaining_time": "0:59:05"}
{"current_steps": 41, "total_steps": 980, "loss": 1.6261, "lr": 4.081632653061225e-06, "epoch": 1.4642857142857144, "percentage": 4.18, "elapsed_time": "0:02:34", "remaining_time": "0:58:58"}
{"current_steps": 42, "total_steps": 980, "loss": 1.6354, "lr": 4.183673469387755e-06, "epoch": 1.5, "percentage": 4.29, "elapsed_time": "0:02:37", "remaining_time": "0:58:45"}
{"current_steps": 43, "total_steps": 980, "loss": 1.7451, "lr": 4.2857142857142855e-06, "epoch": 1.5357142857142856, "percentage": 4.39, "elapsed_time": "0:02:41", "remaining_time": "0:58:30"}
{"current_steps": 44, "total_steps": 980, "loss": 1.5587, "lr": 4.3877551020408165e-06, "epoch": 1.5714285714285714, "percentage": 4.49, "elapsed_time": "0:02:44", "remaining_time": "0:58:19"}
{"current_steps": 45, "total_steps": 980, "loss": 1.6485, "lr": 4.489795918367348e-06, "epoch": 1.6071428571428572, "percentage": 4.59, "elapsed_time": "0:02:47", "remaining_time": "0:58:04"}
{"current_steps": 46, "total_steps": 980, "loss": 1.5298, "lr": 4.591836734693878e-06, "epoch": 1.6428571428571428, "percentage": 4.69, "elapsed_time": "0:02:51", "remaining_time": "0:58:02"}
{"current_steps": 47, "total_steps": 980, "loss": 1.5205, "lr": 4.693877551020409e-06, "epoch": 1.6785714285714286, "percentage": 4.8, "elapsed_time": "0:02:55", "remaining_time": "0:58:01"}
{"current_steps": 48, "total_steps": 980, "loss": 1.4686, "lr": 4.795918367346939e-06, "epoch": 1.7142857142857144, "percentage": 4.9, "elapsed_time": "0:02:58", "remaining_time": "0:57:46"}
{"current_steps": 49, "total_steps": 980, "loss": 1.5902, "lr": 4.897959183673469e-06, "epoch": 1.75, "percentage": 5.0, "elapsed_time": "0:03:02", "remaining_time": "0:57:42"}
{"current_steps": 50, "total_steps": 980, "loss": 1.513, "lr": 5e-06, "epoch": 1.7857142857142856, "percentage": 5.1, "elapsed_time": "0:03:05", "remaining_time": "0:57:39"}
{"current_steps": 51, "total_steps": 980, "loss": 1.5964, "lr": 5.1020408163265315e-06, "epoch": 1.8214285714285714, "percentage": 5.2, "elapsed_time": "0:03:10", "remaining_time": "0:57:45"}
{"current_steps": 52, "total_steps": 980, "loss": 1.4724, "lr": 5.204081632653062e-06, "epoch": 1.8571428571428572, "percentage": 5.31, "elapsed_time": "0:03:13", "remaining_time": "0:57:35"}
{"current_steps": 53, "total_steps": 980, "loss": 1.589, "lr": 5.306122448979593e-06, "epoch": 1.8928571428571428, "percentage": 5.41, "elapsed_time": "0:03:17", "remaining_time": "0:57:39"}
{"current_steps": 54, "total_steps": 980, "loss": 1.5026, "lr": 5.408163265306123e-06, "epoch": 1.9285714285714286, "percentage": 5.51, "elapsed_time": "0:03:21", "remaining_time": "0:57:36"}
{"current_steps": 55, "total_steps": 980, "loss": 1.5709, "lr": 5.510204081632653e-06, "epoch": 1.9642857142857144, "percentage": 5.61, "elapsed_time": "0:03:25", "remaining_time": "0:57:27"}
{"current_steps": 56, "total_steps": 980, "loss": 1.528, "lr": 5.6122448979591834e-06, "epoch": 2.0, "percentage": 5.71, "elapsed_time": "0:03:29", "remaining_time": "0:57:33"}
{"current_steps": 57, "total_steps": 980, "loss": 1.5065, "lr": 5.7142857142857145e-06, "epoch": 2.0357142857142856, "percentage": 5.82, "elapsed_time": "0:03:32", "remaining_time": "0:57:25"}
{"current_steps": 58, "total_steps": 980, "loss": 1.5931, "lr": 5.816326530612246e-06, "epoch": 2.0714285714285716, "percentage": 5.92, "elapsed_time": "0:03:36", "remaining_time": "0:57:14"}
{"current_steps": 59, "total_steps": 980, "loss": 1.5268, "lr": 5.918367346938776e-06, "epoch": 2.107142857142857, "percentage": 6.02, "elapsed_time": "0:03:39", "remaining_time": "0:57:02"}
{"current_steps": 60, "total_steps": 980, "loss": 1.4429, "lr": 6.020408163265307e-06, "epoch": 2.142857142857143, "percentage": 6.12, "elapsed_time": "0:03:43", "remaining_time": "0:57:02"}
{"current_steps": 61, "total_steps": 980, "loss": 1.4426, "lr": 6.122448979591837e-06, "epoch": 2.1785714285714284, "percentage": 6.22, "elapsed_time": "0:03:47", "remaining_time": "0:57:00"}
{"current_steps": 62, "total_steps": 980, "loss": 1.4092, "lr": 6.224489795918368e-06, "epoch": 2.2142857142857144, "percentage": 6.33, "elapsed_time": "0:03:50", "remaining_time": "0:56:49"}
{"current_steps": 63, "total_steps": 980, "loss": 1.4018, "lr": 6.326530612244899e-06, "epoch": 2.25, "percentage": 6.43, "elapsed_time": "0:03:53", "remaining_time": "0:56:39"}
{"current_steps": 64, "total_steps": 980, "loss": 1.3959, "lr": 6.4285714285714295e-06, "epoch": 2.2857142857142856, "percentage": 6.53, "elapsed_time": "0:03:57", "remaining_time": "0:56:32"}
{"current_steps": 65, "total_steps": 980, "loss": 1.3596, "lr": 6.530612244897959e-06, "epoch": 2.3214285714285716, "percentage": 6.63, "elapsed_time": "0:04:01", "remaining_time": "0:56:36"}
{"current_steps": 66, "total_steps": 980, "loss": 1.4646, "lr": 6.63265306122449e-06, "epoch": 2.357142857142857, "percentage": 6.73, "elapsed_time": "0:04:04", "remaining_time": "0:56:25"}
{"current_steps": 67, "total_steps": 980, "loss": 1.4945, "lr": 6.734693877551021e-06, "epoch": 2.392857142857143, "percentage": 6.84, "elapsed_time": "0:04:08", "remaining_time": "0:56:30"}
{"current_steps": 68, "total_steps": 980, "loss": 1.3554, "lr": 6.836734693877551e-06, "epoch": 2.4285714285714284, "percentage": 6.94, "elapsed_time": "0:04:12", "remaining_time": "0:56:32"}
{"current_steps": 69, "total_steps": 980, "loss": 1.3483, "lr": 6.938775510204082e-06, "epoch": 2.4642857142857144, "percentage": 7.04, "elapsed_time": "0:04:16", "remaining_time": "0:56:29"}
{"current_steps": 70, "total_steps": 980, "loss": 1.3678, "lr": 7.0408163265306125e-06, "epoch": 2.5, "percentage": 7.14, "elapsed_time": "0:04:19", "remaining_time": "0:56:19"}
{"current_steps": 71, "total_steps": 980, "loss": 1.4009, "lr": 7.1428571428571436e-06, "epoch": 2.5357142857142856, "percentage": 7.24, "elapsed_time": "0:04:24", "remaining_time": "0:56:22"}
{"current_steps": 72, "total_steps": 980, "loss": 1.3519, "lr": 7.244897959183675e-06, "epoch": 2.571428571428571, "percentage": 7.35, "elapsed_time": "0:04:28", "remaining_time": "0:56:20"}
{"current_steps": 73, "total_steps": 980, "loss": 1.4351, "lr": 7.346938775510205e-06, "epoch": 2.607142857142857, "percentage": 7.45, "elapsed_time": "0:04:32", "remaining_time": "0:56:26"}
{"current_steps": 74, "total_steps": 980, "loss": 1.4096, "lr": 7.448979591836736e-06, "epoch": 2.642857142857143, "percentage": 7.55, "elapsed_time": "0:04:35", "remaining_time": "0:56:16"}
{"current_steps": 75, "total_steps": 980, "loss": 1.4303, "lr": 7.551020408163265e-06, "epoch": 2.678571428571429, "percentage": 7.65, "elapsed_time": "0:04:39", "remaining_time": "0:56:15"}
{"current_steps": 76, "total_steps": 980, "loss": 1.2549, "lr": 7.653061224489796e-06, "epoch": 2.7142857142857144, "percentage": 7.76, "elapsed_time": "0:04:43", "remaining_time": "0:56:12"}
{"current_steps": 77, "total_steps": 980, "loss": 1.303, "lr": 7.755102040816327e-06, "epoch": 2.75, "percentage": 7.86, "elapsed_time": "0:04:47", "remaining_time": "0:56:13"}
{"current_steps": 78, "total_steps": 980, "loss": 1.3732, "lr": 7.857142857142858e-06, "epoch": 2.7857142857142856, "percentage": 7.96, "elapsed_time": "0:04:51", "remaining_time": "0:56:15"}
{"current_steps": 79, "total_steps": 980, "loss": 1.4765, "lr": 7.959183673469388e-06, "epoch": 2.821428571428571, "percentage": 8.06, "elapsed_time": "0:04:55", "remaining_time": "0:56:05"}
{"current_steps": 80, "total_steps": 980, "loss": 1.3302, "lr": 8.06122448979592e-06, "epoch": 2.857142857142857, "percentage": 8.16, "elapsed_time": "0:04:58", "remaining_time": "0:56:03"}
{"current_steps": 81, "total_steps": 980, "loss": 1.3691, "lr": 8.16326530612245e-06, "epoch": 2.892857142857143, "percentage": 8.27, "elapsed_time": "0:05:02", "remaining_time": "0:55:56"}
{"current_steps": 82, "total_steps": 980, "loss": 1.3872, "lr": 8.26530612244898e-06, "epoch": 2.928571428571429, "percentage": 8.37, "elapsed_time": "0:05:05", "remaining_time": "0:55:48"}
{"current_steps": 83, "total_steps": 980, "loss": 1.3095, "lr": 8.36734693877551e-06, "epoch": 2.9642857142857144, "percentage": 8.47, "elapsed_time": "0:05:08", "remaining_time": "0:55:38"}
{"current_steps": 84, "total_steps": 980, "loss": 1.3005, "lr": 8.469387755102042e-06, "epoch": 3.0, "percentage": 8.57, "elapsed_time": "0:05:12", "remaining_time": "0:55:32"}
{"current_steps": 85, "total_steps": 980, "loss": 1.3534, "lr": 8.571428571428571e-06, "epoch": 3.0357142857142856, "percentage": 8.67, "elapsed_time": "0:05:16", "remaining_time": "0:55:27"}
{"current_steps": 86, "total_steps": 980, "loss": 1.2637, "lr": 8.673469387755103e-06, "epoch": 3.0714285714285716, "percentage": 8.78, "elapsed_time": "0:05:20", "remaining_time": "0:55:28"}
{"current_steps": 87, "total_steps": 980, "loss": 1.2964, "lr": 8.775510204081633e-06, "epoch": 3.107142857142857, "percentage": 8.88, "elapsed_time": "0:05:23", "remaining_time": "0:55:19"}
{"current_steps": 88, "total_steps": 980, "loss": 1.26, "lr": 8.877551020408163e-06, "epoch": 3.142857142857143, "percentage": 8.98, "elapsed_time": "0:05:27", "remaining_time": "0:55:16"}
{"current_steps": 89, "total_steps": 980, "loss": 1.2085, "lr": 8.979591836734695e-06, "epoch": 3.1785714285714284, "percentage": 9.08, "elapsed_time": "0:05:31", "remaining_time": "0:55:14"}
{"current_steps": 90, "total_steps": 980, "loss": 1.313, "lr": 9.081632653061225e-06, "epoch": 3.2142857142857144, "percentage": 9.18, "elapsed_time": "0:05:34", "remaining_time": "0:55:06"}
{"current_steps": 91, "total_steps": 980, "loss": 1.2019, "lr": 9.183673469387756e-06, "epoch": 3.25, "percentage": 9.29, "elapsed_time": "0:05:37", "remaining_time": "0:55:00"}
{"current_steps": 92, "total_steps": 980, "loss": 1.2688, "lr": 9.285714285714288e-06, "epoch": 3.2857142857142856, "percentage": 9.39, "elapsed_time": "0:05:42", "remaining_time": "0:55:01"}
{"current_steps": 93, "total_steps": 980, "loss": 1.2488, "lr": 9.387755102040818e-06, "epoch": 3.3214285714285716, "percentage": 9.49, "elapsed_time": "0:05:45", "remaining_time": "0:54:58"}
{"current_steps": 94, "total_steps": 980, "loss": 1.1932, "lr": 9.489795918367348e-06, "epoch": 3.357142857142857, "percentage": 9.59, "elapsed_time": "0:05:49", "remaining_time": "0:54:55"}
{"current_steps": 95, "total_steps": 980, "loss": 1.2833, "lr": 9.591836734693878e-06, "epoch": 3.392857142857143, "percentage": 9.69, "elapsed_time": "0:05:52", "remaining_time": "0:54:48"}
{"current_steps": 96, "total_steps": 980, "loss": 1.1389, "lr": 9.693877551020408e-06, "epoch": 3.4285714285714284, "percentage": 9.8, "elapsed_time": "0:05:56", "remaining_time": "0:54:40"}
{"current_steps": 97, "total_steps": 980, "loss": 1.1914, "lr": 9.795918367346939e-06, "epoch": 3.4642857142857144, "percentage": 9.9, "elapsed_time": "0:05:59", "remaining_time": "0:54:33"}
{"current_steps": 98, "total_steps": 980, "loss": 1.1436, "lr": 9.89795918367347e-06, "epoch": 3.5, "percentage": 10.0, "elapsed_time": "0:06:03", "remaining_time": "0:54:30"}
{"current_steps": 99, "total_steps": 980, "loss": 1.3277, "lr": 1e-05, "epoch": 3.5357142857142856, "percentage": 10.1, "elapsed_time": "0:06:06", "remaining_time": "0:54:23"}
{"current_steps": 100, "total_steps": 980, "loss": 1.1546, "lr": 9.999968282268043e-06, "epoch": 3.571428571428571, "percentage": 10.2, "elapsed_time": "0:06:10", "remaining_time": "0:54:23"}
{"current_steps": 100, "total_steps": 980, "eval_loss": 1.2822846174240112, "epoch": 3.571428571428571, "percentage": 10.2, "elapsed_time": "0:06:11", "remaining_time": "0:54:27"}
{"current_steps": 101, "total_steps": 980, "loss": 1.2382, "lr": 9.999873129474573e-06, "epoch": 3.607142857142857, "percentage": 10.31, "elapsed_time": "0:07:05", "remaining_time": "1:01:39"}
{"current_steps": 102, "total_steps": 980, "loss": 1.3204, "lr": 9.999714542826806e-06, "epoch": 3.642857142857143, "percentage": 10.41, "elapsed_time": "0:07:09", "remaining_time": "1:01:35"}
{"current_steps": 103, "total_steps": 980, "loss": 1.1399, "lr": 9.999492524336743e-06, "epoch": 3.678571428571429, "percentage": 10.51, "elapsed_time": "0:07:13", "remaining_time": "1:01:30"}
{"current_steps": 104, "total_steps": 980, "loss": 1.1609, "lr": 9.999207076821155e-06, "epoch": 3.7142857142857144, "percentage": 10.61, "elapsed_time": "0:07:17", "remaining_time": "1:01:26"}
{"current_steps": 105, "total_steps": 980, "loss": 1.1709, "lr": 9.99885820390154e-06, "epoch": 3.75, "percentage": 10.71, "elapsed_time": "0:07:21", "remaining_time": "1:01:22"}
{"current_steps": 106, "total_steps": 980, "loss": 1.2304, "lr": 9.998445910004082e-06, "epoch": 3.7857142857142856, "percentage": 10.82, "elapsed_time": "0:07:25", "remaining_time": "1:01:10"}
{"current_steps": 107, "total_steps": 980, "loss": 1.2702, "lr": 9.997970200359592e-06, "epoch": 3.821428571428571, "percentage": 10.92, "elapsed_time": "0:07:28", "remaining_time": "1:00:57"}
{"current_steps": 108, "total_steps": 980, "loss": 1.2122, "lr": 9.99743108100344e-06, "epoch": 3.857142857142857, "percentage": 11.02, "elapsed_time": "0:07:31", "remaining_time": "1:00:46"}
{"current_steps": 109, "total_steps": 980, "loss": 1.2045, "lr": 9.996828558775486e-06, "epoch": 3.892857142857143, "percentage": 11.12, "elapsed_time": "0:07:34", "remaining_time": "1:00:35"}
{"current_steps": 110, "total_steps": 980, "loss": 1.1833, "lr": 9.996162641319985e-06, "epoch": 3.928571428571429, "percentage": 11.22, "elapsed_time": "0:07:38", "remaining_time": "1:00:28"}
{"current_steps": 111, "total_steps": 980, "loss": 1.1361, "lr": 9.995433337085492e-06, "epoch": 3.9642857142857144, "percentage": 11.33, "elapsed_time": "0:07:43", "remaining_time": "1:00:24"}
{"current_steps": 112, "total_steps": 980, "loss": 1.1751, "lr": 9.994640655324758e-06, "epoch": 4.0, "percentage": 11.43, "elapsed_time": "0:07:46", "remaining_time": "1:00:15"}
{"current_steps": 113, "total_steps": 980, "loss": 1.0578, "lr": 9.993784606094612e-06, "epoch": 4.035714285714286, "percentage": 11.53, "elapsed_time": "0:07:50", "remaining_time": "1:00:11"}
{"current_steps": 114, "total_steps": 980, "loss": 1.0855, "lr": 9.992865200255829e-06, "epoch": 4.071428571428571, "percentage": 11.63, "elapsed_time": "0:07:53", "remaining_time": "0:59:59"}
{"current_steps": 115, "total_steps": 980, "loss": 1.0501, "lr": 9.991882449472994e-06, "epoch": 4.107142857142857, "percentage": 11.73, "elapsed_time": "0:07:57", "remaining_time": "0:59:48"}
{"current_steps": 116, "total_steps": 980, "loss": 1.0903, "lr": 9.99083636621436e-06, "epoch": 4.142857142857143, "percentage": 11.84, "elapsed_time": "0:08:01", "remaining_time": "0:59:44"}
{"current_steps": 117, "total_steps": 980, "loss": 1.0142, "lr": 9.989726963751683e-06, "epoch": 4.178571428571429, "percentage": 11.94, "elapsed_time": "0:08:04", "remaining_time": "0:59:35"}
{"current_steps": 118, "total_steps": 980, "loss": 1.03, "lr": 9.988554256160052e-06, "epoch": 4.214285714285714, "percentage": 12.04, "elapsed_time": "0:08:08", "remaining_time": "0:59:31"}
{"current_steps": 119, "total_steps": 980, "loss": 1.0143, "lr": 9.987318258317718e-06, "epoch": 4.25, "percentage": 12.14, "elapsed_time": "0:08:12", "remaining_time": "0:59:20"}
{"current_steps": 120, "total_steps": 980, "loss": 0.9545, "lr": 9.986018985905901e-06, "epoch": 4.285714285714286, "percentage": 12.24, "elapsed_time": "0:08:15", "remaining_time": "0:59:10"}
{"current_steps": 121, "total_steps": 980, "loss": 0.969, "lr": 9.984656455408591e-06, "epoch": 4.321428571428571, "percentage": 12.35, "elapsed_time": "0:08:18", "remaining_time": "0:58:59"}
{"current_steps": 122, "total_steps": 980, "loss": 1.1886, "lr": 9.983230684112338e-06, "epoch": 4.357142857142857, "percentage": 12.45, "elapsed_time": "0:08:22", "remaining_time": "0:58:50"}
{"current_steps": 123, "total_steps": 980, "loss": 0.9773, "lr": 9.981741690106035e-06, "epoch": 4.392857142857143, "percentage": 12.55, "elapsed_time": "0:08:25", "remaining_time": "0:58:43"}
{"current_steps": 124, "total_steps": 980, "loss": 1.0976, "lr": 9.980189492280688e-06, "epoch": 4.428571428571429, "percentage": 12.65, "elapsed_time": "0:08:29", "remaining_time": "0:58:34"}
{"current_steps": 125, "total_steps": 980, "loss": 0.9478, "lr": 9.978574110329174e-06, "epoch": 4.464285714285714, "percentage": 12.76, "elapsed_time": "0:08:32", "remaining_time": "0:58:24"}
{"current_steps": 126, "total_steps": 980, "loss": 0.9368, "lr": 9.976895564745993e-06, "epoch": 4.5, "percentage": 12.86, "elapsed_time": "0:08:35", "remaining_time": "0:58:13"}
{"current_steps": 127, "total_steps": 980, "loss": 1.0447, "lr": 9.975153876827008e-06, "epoch": 4.535714285714286, "percentage": 12.96, "elapsed_time": "0:08:38", "remaining_time": "0:58:04"}
{"current_steps": 128, "total_steps": 980, "loss": 1.0044, "lr": 9.973349068669178e-06, "epoch": 4.571428571428571, "percentage": 13.06, "elapsed_time": "0:08:42", "remaining_time": "0:57:58"}
{"current_steps": 129, "total_steps": 980, "loss": 1.0712, "lr": 9.97148116317027e-06, "epoch": 4.607142857142857, "percentage": 13.16, "elapsed_time": "0:08:46", "remaining_time": "0:57:55"}
{"current_steps": 130, "total_steps": 980, "loss": 0.9705, "lr": 9.969550184028572e-06, "epoch": 4.642857142857143, "percentage": 13.27, "elapsed_time": "0:08:50", "remaining_time": "0:57:46"}
{"current_steps": 131, "total_steps": 980, "loss": 1.0405, "lr": 9.9675561557426e-06, "epoch": 4.678571428571429, "percentage": 13.37, "elapsed_time": "0:08:53", "remaining_time": "0:57:36"}
{"current_steps": 132, "total_steps": 980, "loss": 1.0283, "lr": 9.965499103610775e-06, "epoch": 4.714285714285714, "percentage": 13.47, "elapsed_time": "0:08:57", "remaining_time": "0:57:33"}
{"current_steps": 133, "total_steps": 980, "loss": 1.0334, "lr": 9.963379053731104e-06, "epoch": 4.75, "percentage": 13.57, "elapsed_time": "0:09:00", "remaining_time": "0:57:24"}
{"current_steps": 134, "total_steps": 980, "loss": 1.1302, "lr": 9.961196033000862e-06, "epoch": 4.785714285714286, "percentage": 13.67, "elapsed_time": "0:09:04", "remaining_time": "0:57:16"}
{"current_steps": 135, "total_steps": 980, "loss": 0.9444, "lr": 9.95895006911623e-06, "epoch": 4.821428571428571, "percentage": 13.78, "elapsed_time": "0:09:08", "remaining_time": "0:57:10"}
{"current_steps": 136, "total_steps": 980, "loss": 0.9612, "lr": 9.956641190571967e-06, "epoch": 4.857142857142857, "percentage": 13.88, "elapsed_time": "0:09:11", "remaining_time": "0:57:04"}
{"current_steps": 137, "total_steps": 980, "loss": 1.0558, "lr": 9.954269426661023e-06, "epoch": 4.892857142857143, "percentage": 13.98, "elapsed_time": "0:09:16", "remaining_time": "0:57:02"}
{"current_steps": 138, "total_steps": 980, "loss": 0.9476, "lr": 9.951834807474191e-06, "epoch": 4.928571428571429, "percentage": 14.08, "elapsed_time": "0:09:20", "remaining_time": "0:57:00"}
{"current_steps": 139, "total_steps": 980, "loss": 0.994, "lr": 9.949337363899709e-06, "epoch": 4.964285714285714, "percentage": 14.18, "elapsed_time": "0:09:23", "remaining_time": "0:56:51"}
{"current_steps": 140, "total_steps": 980, "loss": 0.8216, "lr": 9.946777127622874e-06, "epoch": 5.0, "percentage": 14.29, "elapsed_time": "0:09:28", "remaining_time": "0:56:48"}
{"current_steps": 141, "total_steps": 980, "loss": 0.8672, "lr": 9.944154131125643e-06, "epoch": 5.035714285714286, "percentage": 14.39, "elapsed_time": "0:09:31", "remaining_time": "0:56:40"}
{"current_steps": 142, "total_steps": 980, "loss": 0.824, "lr": 9.941468407686216e-06, "epoch": 5.071428571428571, "percentage": 14.49, "elapsed_time": "0:09:35", "remaining_time": "0:56:36"}
{"current_steps": 143, "total_steps": 980, "loss": 0.8532, "lr": 9.938719991378614e-06, "epoch": 5.107142857142857, "percentage": 14.59, "elapsed_time": "0:09:39", "remaining_time": "0:56:30"}
{"current_steps": 144, "total_steps": 980, "loss": 0.9036, "lr": 9.935908917072253e-06, "epoch": 5.142857142857143, "percentage": 14.69, "elapsed_time": "0:09:43", "remaining_time": "0:56:28"}
{"current_steps": 145, "total_steps": 980, "loss": 0.8404, "lr": 9.933035220431489e-06, "epoch": 5.178571428571429, "percentage": 14.8, "elapsed_time": "0:09:47", "remaining_time": "0:56:23"}
{"current_steps": 146, "total_steps": 980, "loss": 0.8397, "lr": 9.930098937915177e-06, "epoch": 5.214285714285714, "percentage": 14.9, "elapsed_time": "0:09:50", "remaining_time": "0:56:14"}
{"current_steps": 147, "total_steps": 980, "loss": 0.8126, "lr": 9.927100106776213e-06, "epoch": 5.25, "percentage": 15.0, "elapsed_time": "0:09:54", "remaining_time": "0:56:07"}
{"current_steps": 148, "total_steps": 980, "loss": 0.8103, "lr": 9.924038765061042e-06, "epoch": 5.285714285714286, "percentage": 15.1, "elapsed_time": "0:09:58", "remaining_time": "0:56:02"}
{"current_steps": 149, "total_steps": 980, "loss": 0.7544, "lr": 9.920914951609189e-06, "epoch": 5.321428571428571, "percentage": 15.2, "elapsed_time": "0:10:01", "remaining_time": "0:55:56"}
{"current_steps": 150, "total_steps": 980, "loss": 0.8543, "lr": 9.917728706052765e-06, "epoch": 5.357142857142857, "percentage": 15.31, "elapsed_time": "0:10:05", "remaining_time": "0:55:48"}
{"current_steps": 151, "total_steps": 980, "loss": 0.7868, "lr": 9.914480068815964e-06, "epoch": 5.392857142857143, "percentage": 15.41, "elapsed_time": "0:10:09", "remaining_time": "0:55:45"}
{"current_steps": 152, "total_steps": 980, "loss": 0.7768, "lr": 9.91116908111455e-06, "epoch": 5.428571428571429, "percentage": 15.51, "elapsed_time": "0:10:12", "remaining_time": "0:55:37"}
{"current_steps": 153, "total_steps": 980, "loss": 0.8077, "lr": 9.907795784955327e-06, "epoch": 5.464285714285714, "percentage": 15.61, "elapsed_time": "0:10:16", "remaining_time": "0:55:33"}
{"current_steps": 154, "total_steps": 980, "loss": 0.7622, "lr": 9.90436022313562e-06, "epoch": 5.5, "percentage": 15.71, "elapsed_time": "0:10:20", "remaining_time": "0:55:27"}
{"current_steps": 155, "total_steps": 980, "loss": 0.8162, "lr": 9.900862439242719e-06, "epoch": 5.535714285714286, "percentage": 15.82, "elapsed_time": "0:10:24", "remaining_time": "0:55:24"}
{"current_steps": 156, "total_steps": 980, "loss": 0.7768, "lr": 9.897302477653334e-06, "epoch": 5.571428571428571, "percentage": 15.92, "elapsed_time": "0:10:28", "remaining_time": "0:55:19"}
{"current_steps": 157, "total_steps": 980, "loss": 0.8367, "lr": 9.893680383533027e-06, "epoch": 5.607142857142857, "percentage": 16.02, "elapsed_time": "0:10:32", "remaining_time": "0:55:15"}
{"current_steps": 158, "total_steps": 980, "loss": 0.752, "lr": 9.889996202835642e-06, "epoch": 5.642857142857143, "percentage": 16.12, "elapsed_time": "0:10:36", "remaining_time": "0:55:09"}
{"current_steps": 159, "total_steps": 980, "loss": 0.878, "lr": 9.88624998230272e-06, "epoch": 5.678571428571429, "percentage": 16.22, "elapsed_time": "0:10:39", "remaining_time": "0:55:01"}
{"current_steps": 160, "total_steps": 980, "loss": 0.7647, "lr": 9.882441769462911e-06, "epoch": 5.714285714285714, "percentage": 16.33, "elapsed_time": "0:10:43", "remaining_time": "0:54:57"}
{"current_steps": 161, "total_steps": 980, "loss": 0.8364, "lr": 9.878571612631364e-06, "epoch": 5.75, "percentage": 16.43, "elapsed_time": "0:10:47", "remaining_time": "0:54:54"}
{"current_steps": 162, "total_steps": 980, "loss": 0.8453, "lr": 9.874639560909118e-06, "epoch": 5.785714285714286, "percentage": 16.53, "elapsed_time": "0:10:50", "remaining_time": "0:54:46"}
{"current_steps": 163, "total_steps": 980, "loss": 0.76, "lr": 9.870645664182478e-06, "epoch": 5.821428571428571, "percentage": 16.63, "elapsed_time": "0:10:55", "remaining_time": "0:54:44"}
{"current_steps": 164, "total_steps": 980, "loss": 0.7596, "lr": 9.86658997312238e-06, "epoch": 5.857142857142857, "percentage": 16.73, "elapsed_time": "0:10:58", "remaining_time": "0:54:37"}
{"current_steps": 165, "total_steps": 980, "loss": 0.8612, "lr": 9.862472539183757e-06, "epoch": 5.892857142857143, "percentage": 16.84, "elapsed_time": "0:11:01", "remaining_time": "0:54:29"}
{"current_steps": 166, "total_steps": 980, "loss": 0.8048, "lr": 9.858293414604871e-06, "epoch": 5.928571428571429, "percentage": 16.94, "elapsed_time": "0:11:05", "remaining_time": "0:54:24"}
{"current_steps": 167, "total_steps": 980, "loss": 0.7531, "lr": 9.854052652406666e-06, "epoch": 5.964285714285714, "percentage": 17.04, "elapsed_time": "0:11:08", "remaining_time": "0:54:15"}
{"current_steps": 168, "total_steps": 980, "loss": 0.6251, "lr": 9.849750306392085e-06, "epoch": 6.0, "percentage": 17.14, "elapsed_time": "0:11:12", "remaining_time": "0:54:09"}
{"current_steps": 169, "total_steps": 980, "loss": 0.6708, "lr": 9.84538643114539e-06, "epoch": 6.035714285714286, "percentage": 17.24, "elapsed_time": "0:11:15", "remaining_time": "0:54:01"}
{"current_steps": 170, "total_steps": 980, "loss": 0.6973, "lr": 9.840961082031473e-06, "epoch": 6.071428571428571, "percentage": 17.35, "elapsed_time": "0:11:19", "remaining_time": "0:53:56"}
{"current_steps": 171, "total_steps": 980, "loss": 0.6517, "lr": 9.836474315195148e-06, "epoch": 6.107142857142857, "percentage": 17.45, "elapsed_time": "0:11:22", "remaining_time": "0:53:47"}
{"current_steps": 172, "total_steps": 980, "loss": 0.6084, "lr": 9.831926187560441e-06, "epoch": 6.142857142857143, "percentage": 17.55, "elapsed_time": "0:11:26", "remaining_time": "0:53:42"}
{"current_steps": 173, "total_steps": 980, "loss": 0.5943, "lr": 9.827316756829871e-06, "epoch": 6.178571428571429, "percentage": 17.65, "elapsed_time": "0:11:29", "remaining_time": "0:53:38"}
{"current_steps": 174, "total_steps": 980, "loss": 0.6451, "lr": 9.822646081483713e-06, "epoch": 6.214285714285714, "percentage": 17.76, "elapsed_time": "0:11:34", "remaining_time": "0:53:35"}
{"current_steps": 175, "total_steps": 980, "loss": 0.6001, "lr": 9.817914220779258e-06, "epoch": 6.25, "percentage": 17.86, "elapsed_time": "0:11:37", "remaining_time": "0:53:28"}
{"current_steps": 176, "total_steps": 980, "loss": 0.5976, "lr": 9.81312123475006e-06, "epoch": 6.285714285714286, "percentage": 17.96, "elapsed_time": "0:11:41", "remaining_time": "0:53:23"}
{"current_steps": 177, "total_steps": 980, "loss": 0.5813, "lr": 9.808267184205182e-06, "epoch": 6.321428571428571, "percentage": 18.06, "elapsed_time": "0:11:44", "remaining_time": "0:53:17"}
{"current_steps": 178, "total_steps": 980, "loss": 0.5511, "lr": 9.80335213072841e-06, "epoch": 6.357142857142857, "percentage": 18.16, "elapsed_time": "0:11:48", "remaining_time": "0:53:14"}
{"current_steps": 179, "total_steps": 980, "loss": 0.5579, "lr": 9.798376136677486e-06, "epoch": 6.392857142857143, "percentage": 18.27, "elapsed_time": "0:11:52", "remaining_time": "0:53:07"}
{"current_steps": 180, "total_steps": 980, "loss": 0.527, "lr": 9.793339265183303e-06, "epoch": 6.428571428571429, "percentage": 18.37, "elapsed_time": "0:11:56", "remaining_time": "0:53:04"}
{"current_steps": 181, "total_steps": 980, "loss": 0.5881, "lr": 9.788241580149123e-06, "epoch": 6.464285714285714, "percentage": 18.47, "elapsed_time": "0:12:00", "remaining_time": "0:52:58"}
{"current_steps": 182, "total_steps": 980, "loss": 0.5526, "lr": 9.783083146249749e-06, "epoch": 6.5, "percentage": 18.57, "elapsed_time": "0:12:03", "remaining_time": "0:52:51"}
{"current_steps": 183, "total_steps": 980, "loss": 0.5739, "lr": 9.777864028930705e-06, "epoch": 6.535714285714286, "percentage": 18.67, "elapsed_time": "0:12:06", "remaining_time": "0:52:45"}
{"current_steps": 184, "total_steps": 980, "loss": 0.5514, "lr": 9.77258429440742e-06, "epoch": 6.571428571428571, "percentage": 18.78, "elapsed_time": "0:12:10", "remaining_time": "0:52:41"}
{"current_steps": 185, "total_steps": 980, "loss": 0.566, "lr": 9.767244009664376e-06, "epoch": 6.607142857142857, "percentage": 18.88, "elapsed_time": "0:12:14", "remaining_time": "0:52:36"}
{"current_steps": 186, "total_steps": 980, "loss": 0.596, "lr": 9.761843242454261e-06, "epoch": 6.642857142857143, "percentage": 18.98, "elapsed_time": "0:12:17", "remaining_time": "0:52:30"}
{"current_steps": 187, "total_steps": 980, "loss": 0.5865, "lr": 9.75638206129711e-06, "epoch": 6.678571428571429, "percentage": 19.08, "elapsed_time": "0:12:22", "remaining_time": "0:52:27"}
{"current_steps": 188, "total_steps": 980, "loss": 0.6362, "lr": 9.750860535479434e-06, "epoch": 6.714285714285714, "percentage": 19.18, "elapsed_time": "0:12:25", "remaining_time": "0:52:21"}
{"current_steps": 189, "total_steps": 980, "loss": 0.5731, "lr": 9.745278735053345e-06, "epoch": 6.75, "percentage": 19.29, "elapsed_time": "0:12:29", "remaining_time": "0:52:15"}
{"current_steps": 190, "total_steps": 980, "loss": 0.5541, "lr": 9.73963673083566e-06, "epoch": 6.785714285714286, "percentage": 19.39, "elapsed_time": "0:12:33", "remaining_time": "0:52:12"}
{"current_steps": 191, "total_steps": 980, "loss": 0.5517, "lr": 9.733934594407012e-06, "epoch": 6.821428571428571, "percentage": 19.49, "elapsed_time": "0:12:38", "remaining_time": "0:52:11"}
{"current_steps": 192, "total_steps": 980, "loss": 0.5111, "lr": 9.728172398110935e-06, "epoch": 6.857142857142857, "percentage": 19.59, "elapsed_time": "0:12:42", "remaining_time": "0:52:09"}
{"current_steps": 193, "total_steps": 980, "loss": 0.5726, "lr": 9.722350215052946e-06, "epoch": 6.892857142857143, "percentage": 19.69, "elapsed_time": "0:12:45", "remaining_time": "0:52:02"}
{"current_steps": 194, "total_steps": 980, "loss": 0.5435, "lr": 9.716468119099626e-06, "epoch": 6.928571428571429, "percentage": 19.8, "elapsed_time": "0:12:49", "remaining_time": "0:51:56"}
{"current_steps": 195, "total_steps": 980, "loss": 0.5764, "lr": 9.710526184877667e-06, "epoch": 6.964285714285714, "percentage": 19.9, "elapsed_time": "0:12:53", "remaining_time": "0:51:53"}
{"current_steps": 196, "total_steps": 980, "loss": 0.4543, "lr": 9.704524487772944e-06, "epoch": 7.0, "percentage": 20.0, "elapsed_time": "0:12:56", "remaining_time": "0:51:46"}
{"current_steps": 197, "total_steps": 980, "loss": 0.3993, "lr": 9.698463103929542e-06, "epoch": 7.035714285714286, "percentage": 20.1, "elapsed_time": "0:12:59", "remaining_time": "0:51:40"}
{"current_steps": 198, "total_steps": 980, "loss": 0.3759, "lr": 9.692342110248802e-06, "epoch": 7.071428571428571, "percentage": 20.2, "elapsed_time": "0:13:03", "remaining_time": "0:51:33"}
{"current_steps": 199, "total_steps": 980, "loss": 0.35, "lr": 9.68616158438834e-06, "epoch": 7.107142857142857, "percentage": 20.31, "elapsed_time": "0:13:07", "remaining_time": "0:51:29"}
{"current_steps": 200, "total_steps": 980, "loss": 0.4067, "lr": 9.679921604761056e-06, "epoch": 7.142857142857143, "percentage": 20.41, "elapsed_time": "0:13:11", "remaining_time": "0:51:26"}
{"current_steps": 200, "total_steps": 980, "eval_loss": 1.6618373394012451, "epoch": 7.142857142857143, "percentage": 20.41, "elapsed_time": "0:13:11", "remaining_time": "0:51:28"}
{"current_steps": 201, "total_steps": 980, "loss": 0.3858, "lr": 9.673622250534155e-06, "epoch": 7.178571428571429, "percentage": 20.51, "elapsed_time": "0:14:02", "remaining_time": "0:54:23"}
{"current_steps": 202, "total_steps": 980, "loss": 0.3662, "lr": 9.66726360162813e-06, "epoch": 7.214285714285714, "percentage": 20.61, "elapsed_time": "0:14:05", "remaining_time": "0:54:17"}
{"current_steps": 203, "total_steps": 980, "loss": 0.3926, "lr": 9.660845738715743e-06, "epoch": 7.25, "percentage": 20.71, "elapsed_time": "0:14:09", "remaining_time": "0:54:09"}
{"current_steps": 204, "total_steps": 980, "loss": 0.4011, "lr": 9.654368743221022e-06, "epoch": 7.285714285714286, "percentage": 20.82, "elapsed_time": "0:14:12", "remaining_time": "0:54:01"}
{"current_steps": 205, "total_steps": 980, "loss": 0.3561, "lr": 9.647832697318207e-06, "epoch": 7.321428571428571, "percentage": 20.92, "elapsed_time": "0:14:15", "remaining_time": "0:53:54"}
{"current_steps": 206, "total_steps": 980, "loss": 0.397, "lr": 9.641237683930722e-06, "epoch": 7.357142857142857, "percentage": 21.02, "elapsed_time": "0:14:18", "remaining_time": "0:53:46"}
{"current_steps": 207, "total_steps": 980, "loss": 0.3405, "lr": 9.63458378673011e-06, "epoch": 7.392857142857143, "percentage": 21.12, "elapsed_time": "0:14:22", "remaining_time": "0:53:40"}
{"current_steps": 208, "total_steps": 980, "loss": 0.327, "lr": 9.627871090134984e-06, "epoch": 7.428571428571429, "percentage": 21.22, "elapsed_time": "0:14:26", "remaining_time": "0:53:36"}
{"current_steps": 209, "total_steps": 980, "loss": 0.3921, "lr": 9.621099679309948e-06, "epoch": 7.464285714285714, "percentage": 21.33, "elapsed_time": "0:14:30", "remaining_time": "0:53:30"}
{"current_steps": 210, "total_steps": 980, "loss": 0.3775, "lr": 9.61426964016452e-06, "epoch": 7.5, "percentage": 21.43, "elapsed_time": "0:14:33", "remaining_time": "0:53:23"}
{"current_steps": 211, "total_steps": 980, "loss": 0.3586, "lr": 9.60738105935204e-06, "epoch": 7.535714285714286, "percentage": 21.53, "elapsed_time": "0:14:37", "remaining_time": "0:53:18"}
{"current_steps": 212, "total_steps": 980, "loss": 0.3626, "lr": 9.60043402426857e-06, "epoch": 7.571428571428571, "percentage": 21.63, "elapsed_time": "0:14:41", "remaining_time": "0:53:14"}
{"current_steps": 213, "total_steps": 980, "loss": 0.3889, "lr": 9.593428623051793e-06, "epoch": 7.607142857142857, "percentage": 21.73, "elapsed_time": "0:14:45", "remaining_time": "0:53:09"}
{"current_steps": 214, "total_steps": 980, "loss": 0.4192, "lr": 9.58636494457988e-06, "epoch": 7.642857142857143, "percentage": 21.84, "elapsed_time": "0:14:48", "remaining_time": "0:53:01"}
{"current_steps": 215, "total_steps": 980, "loss": 0.408, "lr": 9.57924307847038e-06, "epoch": 7.678571428571429, "percentage": 21.94, "elapsed_time": "0:14:53", "remaining_time": "0:52:57"}
{"current_steps": 216, "total_steps": 980, "loss": 0.3425, "lr": 9.572063115079063e-06, "epoch": 7.714285714285714, "percentage": 22.04, "elapsed_time": "0:14:56", "remaining_time": "0:52:52"}
{"current_steps": 217, "total_steps": 980, "loss": 0.3447, "lr": 9.564825145498795e-06, "epoch": 7.75, "percentage": 22.14, "elapsed_time": "0:15:00", "remaining_time": "0:52:45"}
{"current_steps": 218, "total_steps": 980, "loss": 0.3816, "lr": 9.557529261558367e-06, "epoch": 7.785714285714286, "percentage": 22.24, "elapsed_time": "0:15:03", "remaining_time": "0:52:38"}
{"current_steps": 219, "total_steps": 980, "loss": 0.3568, "lr": 9.550175555821333e-06, "epoch": 7.821428571428571, "percentage": 22.35, "elapsed_time": "0:15:06", "remaining_time": "0:52:31"}
{"current_steps": 220, "total_steps": 980, "loss": 0.4127, "lr": 9.542764121584845e-06, "epoch": 7.857142857142857, "percentage": 22.45, "elapsed_time": "0:15:10", "remaining_time": "0:52:26"}
{"current_steps": 221, "total_steps": 980, "loss": 0.3844, "lr": 9.53529505287845e-06, "epoch": 7.892857142857143, "percentage": 22.55, "elapsed_time": "0:15:14", "remaining_time": "0:52:19"}
{"current_steps": 222, "total_steps": 980, "loss": 0.3597, "lr": 9.527768444462922e-06, "epoch": 7.928571428571429, "percentage": 22.65, "elapsed_time": "0:15:17", "remaining_time": "0:52:12"}
{"current_steps": 223, "total_steps": 980, "loss": 0.4019, "lr": 9.520184391829037e-06, "epoch": 7.964285714285714, "percentage": 22.76, "elapsed_time": "0:15:21", "remaining_time": "0:52:08"}
{"current_steps": 224, "total_steps": 980, "loss": 0.2579, "lr": 9.512542991196377e-06, "epoch": 8.0, "percentage": 22.86, "elapsed_time": "0:15:24", "remaining_time": "0:52:01"}
{"current_steps": 225, "total_steps": 980, "loss": 0.2908, "lr": 9.504844339512096e-06, "epoch": 8.035714285714286, "percentage": 22.96, "elapsed_time": "0:15:28", "remaining_time": "0:51:56"}
{"current_steps": 226, "total_steps": 980, "loss": 0.2495, "lr": 9.497088534449707e-06, "epoch": 8.071428571428571, "percentage": 23.06, "elapsed_time": "0:15:31", "remaining_time": "0:51:49"}
{"current_steps": 227, "total_steps": 980, "loss": 0.2688, "lr": 9.489275674407826e-06, "epoch": 8.107142857142858, "percentage": 23.16, "elapsed_time": "0:15:35", "remaining_time": "0:51:43"}
{"current_steps": 228, "total_steps": 980, "loss": 0.2262, "lr": 9.481405858508935e-06, "epoch": 8.142857142857142, "percentage": 23.27, "elapsed_time": "0:15:38", "remaining_time": "0:51:37"}
{"current_steps": 229, "total_steps": 980, "loss": 0.2447, "lr": 9.473479186598115e-06, "epoch": 8.178571428571429, "percentage": 23.37, "elapsed_time": "0:15:42", "remaining_time": "0:51:30"}
{"current_steps": 230, "total_steps": 980, "loss": 0.2446, "lr": 9.465495759241793e-06, "epoch": 8.214285714285714, "percentage": 23.47, "elapsed_time": "0:15:45", "remaining_time": "0:51:24"}
{"current_steps": 231, "total_steps": 980, "loss": 0.2381, "lr": 9.457455677726447e-06, "epoch": 8.25, "percentage": 23.57, "elapsed_time": "0:15:50", "remaining_time": "0:51:20"}
{"current_steps": 232, "total_steps": 980, "loss": 0.2048, "lr": 9.449359044057344e-06, "epoch": 8.285714285714286, "percentage": 23.67, "elapsed_time": "0:15:53", "remaining_time": "0:51:15"}
{"current_steps": 233, "total_steps": 980, "loss": 0.2285, "lr": 9.441205960957221e-06, "epoch": 8.321428571428571, "percentage": 23.78, "elapsed_time": "0:15:58", "remaining_time": "0:51:11"}
{"current_steps": 234, "total_steps": 980, "loss": 0.2356, "lr": 9.432996531865001e-06, "epoch": 8.357142857142858, "percentage": 23.88, "elapsed_time": "0:16:01", "remaining_time": "0:51:04"}
{"current_steps": 235, "total_steps": 980, "loss": 0.2461, "lr": 9.424730860934474e-06, "epoch": 8.392857142857142, "percentage": 23.98, "elapsed_time": "0:16:04", "remaining_time": "0:50:57"}
{"current_steps": 236, "total_steps": 980, "loss": 0.2078, "lr": 9.416409053032971e-06, "epoch": 8.428571428571429, "percentage": 24.08, "elapsed_time": "0:16:07", "remaining_time": "0:50:51"}
{"current_steps": 237, "total_steps": 980, "loss": 0.2085, "lr": 9.408031213740045e-06, "epoch": 8.464285714285714, "percentage": 24.18, "elapsed_time": "0:16:12", "remaining_time": "0:50:47"}
{"current_steps": 238, "total_steps": 980, "loss": 0.2101, "lr": 9.399597449346119e-06, "epoch": 8.5, "percentage": 24.29, "elapsed_time": "0:16:16", "remaining_time": "0:50:44"}
{"current_steps": 239, "total_steps": 980, "loss": 0.2305, "lr": 9.391107866851143e-06, "epoch": 8.535714285714286, "percentage": 24.39, "elapsed_time": "0:16:19", "remaining_time": "0:50:37"}
{"current_steps": 240, "total_steps": 980, "loss": 0.2392, "lr": 9.382562573963238e-06, "epoch": 8.571428571428571, "percentage": 24.49, "elapsed_time": "0:16:24", "remaining_time": "0:50:34"}
{"current_steps": 241, "total_steps": 980, "loss": 0.2314, "lr": 9.37396167909733e-06, "epoch": 8.607142857142858, "percentage": 24.59, "elapsed_time": "0:16:28", "remaining_time": "0:50:30"}
{"current_steps": 242, "total_steps": 980, "loss": 0.2831, "lr": 9.365305291373769e-06, "epoch": 8.642857142857142, "percentage": 24.69, "elapsed_time": "0:16:32", "remaining_time": "0:50:25"}
{"current_steps": 243, "total_steps": 980, "loss": 0.2016, "lr": 9.356593520616948e-06, "epoch": 8.678571428571429, "percentage": 24.8, "elapsed_time": "0:16:35", "remaining_time": "0:50:19"}
{"current_steps": 244, "total_steps": 980, "loss": 0.1895, "lr": 9.347826477353911e-06, "epoch": 8.714285714285714, "percentage": 24.9, "elapsed_time": "0:16:39", "remaining_time": "0:50:13"}
{"current_steps": 245, "total_steps": 980, "loss": 0.2404, "lr": 9.33900427281295e-06, "epoch": 8.75, "percentage": 25.0, "elapsed_time": "0:16:42", "remaining_time": "0:50:07"}
{"current_steps": 246, "total_steps": 980, "loss": 0.2037, "lr": 9.330127018922195e-06, "epoch": 8.785714285714286, "percentage": 25.1, "elapsed_time": "0:16:45", "remaining_time": "0:50:00"}
{"current_steps": 247, "total_steps": 980, "loss": 0.2165, "lr": 9.321194828308185e-06, "epoch": 8.821428571428571, "percentage": 25.2, "elapsed_time": "0:16:49", "remaining_time": "0:49:54"}
{"current_steps": 248, "total_steps": 980, "loss": 0.2109, "lr": 9.312207814294454e-06, "epoch": 8.857142857142858, "percentage": 25.31, "elapsed_time": "0:16:53", "remaining_time": "0:49:51"}
{"current_steps": 249, "total_steps": 980, "loss": 0.212, "lr": 9.303166090900082e-06, "epoch": 8.892857142857142, "percentage": 25.41, "elapsed_time": "0:16:56", "remaining_time": "0:49:44"}
{"current_steps": 250, "total_steps": 980, "loss": 0.2078, "lr": 9.294069772838253e-06, "epoch": 8.928571428571429, "percentage": 25.51, "elapsed_time": "0:17:00", "remaining_time": "0:49:39"}
{"current_steps": 251, "total_steps": 980, "loss": 0.2207, "lr": 9.284918975514798e-06, "epoch": 8.964285714285714, "percentage": 25.61, "elapsed_time": "0:17:04", "remaining_time": "0:49:35"}
{"current_steps": 252, "total_steps": 980, "loss": 0.1748, "lr": 9.275713815026732e-06, "epoch": 9.0, "percentage": 25.71, "elapsed_time": "0:17:08", "remaining_time": "0:49:30"}
{"current_steps": 253, "total_steps": 980, "loss": 0.1457, "lr": 9.266454408160779e-06, "epoch": 9.035714285714286, "percentage": 25.82, "elapsed_time": "0:17:11", "remaining_time": "0:49:24"}
{"current_steps": 254, "total_steps": 980, "loss": 0.1342, "lr": 9.257140872391895e-06, "epoch": 9.071428571428571, "percentage": 25.92, "elapsed_time": "0:17:15", "remaining_time": "0:49:18"}
{"current_steps": 255, "total_steps": 980, "loss": 0.1019, "lr": 9.24777332588177e-06, "epoch": 9.107142857142858, "percentage": 26.02, "elapsed_time": "0:17:18", "remaining_time": "0:49:13"}
{"current_steps": 256, "total_steps": 980, "loss": 0.1322, "lr": 9.238351887477338e-06, "epoch": 9.142857142857142, "percentage": 26.12, "elapsed_time": "0:17:22", "remaining_time": "0:49:07"}
{"current_steps": 257, "total_steps": 980, "loss": 0.1442, "lr": 9.22887667670926e-06, "epoch": 9.178571428571429, "percentage": 26.22, "elapsed_time": "0:17:25", "remaining_time": "0:49:02"}
{"current_steps": 258, "total_steps": 980, "loss": 0.1149, "lr": 9.219347813790416e-06, "epoch": 9.214285714285714, "percentage": 26.33, "elapsed_time": "0:17:30", "remaining_time": "0:48:59"}
{"current_steps": 259, "total_steps": 980, "loss": 0.1544, "lr": 9.209765419614375e-06, "epoch": 9.25, "percentage": 26.43, "elapsed_time": "0:17:33", "remaining_time": "0:48:53"}
{"current_steps": 260, "total_steps": 980, "loss": 0.1247, "lr": 9.200129615753858e-06, "epoch": 9.285714285714286, "percentage": 26.53, "elapsed_time": "0:17:36", "remaining_time": "0:48:47"}
{"current_steps": 261, "total_steps": 980, "loss": 0.1597, "lr": 9.190440524459203e-06, "epoch": 9.321428571428571, "percentage": 26.63, "elapsed_time": "0:17:40", "remaining_time": "0:48:40"}
{"current_steps": 262, "total_steps": 980, "loss": 0.1262, "lr": 9.180698268656814e-06, "epoch": 9.357142857142858, "percentage": 26.73, "elapsed_time": "0:17:43", "remaining_time": "0:48:34"}
{"current_steps": 263, "total_steps": 980, "loss": 0.1283, "lr": 9.170902971947589e-06, "epoch": 9.392857142857142, "percentage": 26.84, "elapsed_time": "0:17:47", "remaining_time": "0:48:31"}
{"current_steps": 264, "total_steps": 980, "loss": 0.1142, "lr": 9.16105475860537e-06, "epoch": 9.428571428571429, "percentage": 26.94, "elapsed_time": "0:17:51", "remaining_time": "0:48:24"}
{"current_steps": 265, "total_steps": 980, "loss": 0.1241, "lr": 9.151153753575351e-06, "epoch": 9.464285714285714, "percentage": 27.04, "elapsed_time": "0:17:54", "remaining_time": "0:48:20"}
{"current_steps": 266, "total_steps": 980, "loss": 0.1157, "lr": 9.141200082472503e-06, "epoch": 9.5, "percentage": 27.14, "elapsed_time": "0:17:58", "remaining_time": "0:48:15"}
{"current_steps": 267, "total_steps": 980, "loss": 0.1696, "lr": 9.131193871579975e-06, "epoch": 9.535714285714286, "percentage": 27.24, "elapsed_time": "0:18:02", "remaining_time": "0:48:09"}
{"current_steps": 268, "total_steps": 980, "loss": 0.1364, "lr": 9.121135247847492e-06, "epoch": 9.571428571428571, "percentage": 27.35, "elapsed_time": "0:18:05", "remaining_time": "0:48:04"}
{"current_steps": 269, "total_steps": 980, "loss": 0.1288, "lr": 9.111024338889748e-06, "epoch": 9.607142857142858, "percentage": 27.45, "elapsed_time": "0:18:09", "remaining_time": "0:47:58"}
{"current_steps": 270, "total_steps": 980, "loss": 0.1219, "lr": 9.10086127298478e-06, "epoch": 9.642857142857142, "percentage": 27.55, "elapsed_time": "0:18:13", "remaining_time": "0:47:55"}
{"current_steps": 271, "total_steps": 980, "loss": 0.1314, "lr": 9.090646179072352e-06, "epoch": 9.678571428571429, "percentage": 27.65, "elapsed_time": "0:18:17", "remaining_time": "0:47:50"}
{"current_steps": 272, "total_steps": 980, "loss": 0.1295, "lr": 9.080379186752304e-06, "epoch": 9.714285714285714, "percentage": 27.76, "elapsed_time": "0:18:21", "remaining_time": "0:47:46"}
{"current_steps": 273, "total_steps": 980, "loss": 0.1494, "lr": 9.070060426282924e-06, "epoch": 9.75, "percentage": 27.86, "elapsed_time": "0:18:25", "remaining_time": "0:47:43"}
{"current_steps": 274, "total_steps": 980, "loss": 0.1142, "lr": 9.059690028579285e-06, "epoch": 9.785714285714286, "percentage": 27.96, "elapsed_time": "0:18:28", "remaining_time": "0:47:37"}
{"current_steps": 275, "total_steps": 980, "loss": 0.1331, "lr": 9.049268125211577e-06, "epoch": 9.821428571428571, "percentage": 28.06, "elapsed_time": "0:18:32", "remaining_time": "0:47:31"}
{"current_steps": 276, "total_steps": 980, "loss": 0.158, "lr": 9.038794848403463e-06, "epoch": 9.857142857142858, "percentage": 28.16, "elapsed_time": "0:18:35", "remaining_time": "0:47:26"}
{"current_steps": 277, "total_steps": 980, "loss": 0.1281, "lr": 9.028270331030373e-06, "epoch": 9.892857142857142, "percentage": 28.27, "elapsed_time": "0:18:40", "remaining_time": "0:47:22"}
{"current_steps": 278, "total_steps": 980, "loss": 0.1477, "lr": 9.017694706617836e-06, "epoch": 9.928571428571429, "percentage": 28.37, "elapsed_time": "0:18:44", "remaining_time": "0:47:19"}
{"current_steps": 279, "total_steps": 980, "loss": 0.116, "lr": 9.007068109339783e-06, "epoch": 9.964285714285714, "percentage": 28.47, "elapsed_time": "0:18:48", "remaining_time": "0:47:14"}
{"current_steps": 280, "total_steps": 980, "loss": 0.0847, "lr": 8.996390674016839e-06, "epoch": 10.0, "percentage": 28.57, "elapsed_time": "0:18:51", "remaining_time": "0:47:08"}
{"current_steps": 281, "total_steps": 980, "loss": 0.0765, "lr": 8.985662536114614e-06, "epoch": 10.035714285714286, "percentage": 28.67, "elapsed_time": "0:18:55", "remaining_time": "0:47:03"}
{"current_steps": 282, "total_steps": 980, "loss": 0.086, "lr": 8.97488383174199e-06, "epoch": 10.071428571428571, "percentage": 28.78, "elapsed_time": "0:18:58", "remaining_time": "0:46:59"}
{"current_steps": 283, "total_steps": 980, "loss": 0.0736, "lr": 8.964054697649389e-06, "epoch": 10.107142857142858, "percentage": 28.88, "elapsed_time": "0:19:03", "remaining_time": "0:46:55"}
{"current_steps": 284, "total_steps": 980, "loss": 0.0702, "lr": 8.953175271227042e-06, "epoch": 10.142857142857142, "percentage": 28.98, "elapsed_time": "0:19:06", "remaining_time": "0:46:49"}
{"current_steps": 285, "total_steps": 980, "loss": 0.0662, "lr": 8.94224569050324e-06, "epoch": 10.178571428571429, "percentage": 29.08, "elapsed_time": "0:19:10", "remaining_time": "0:46:45"}
{"current_steps": 286, "total_steps": 980, "loss": 0.0878, "lr": 8.931266094142588e-06, "epoch": 10.214285714285714, "percentage": 29.18, "elapsed_time": "0:19:14", "remaining_time": "0:46:41"}
{"current_steps": 287, "total_steps": 980, "loss": 0.0716, "lr": 8.920236621444243e-06, "epoch": 10.25, "percentage": 29.29, "elapsed_time": "0:19:17", "remaining_time": "0:46:36"}
{"current_steps": 288, "total_steps": 980, "loss": 0.0769, "lr": 8.90915741234015e-06, "epoch": 10.285714285714286, "percentage": 29.39, "elapsed_time": "0:19:21", "remaining_time": "0:46:30"}
{"current_steps": 289, "total_steps": 980, "loss": 0.062, "lr": 8.89802860739326e-06, "epoch": 10.321428571428571, "percentage": 29.49, "elapsed_time": "0:19:25", "remaining_time": "0:46:27"}
{"current_steps": 290, "total_steps": 980, "loss": 0.0857, "lr": 8.88685034779576e-06, "epoch": 10.357142857142858, "percentage": 29.59, "elapsed_time": "0:19:28", "remaining_time": "0:46:21"}
{"current_steps": 291, "total_steps": 980, "loss": 0.0908, "lr": 8.87562277536726e-06, "epoch": 10.392857142857142, "percentage": 29.69, "elapsed_time": "0:19:33", "remaining_time": "0:46:17"}
{"current_steps": 292, "total_steps": 980, "loss": 0.068, "lr": 8.864346032553016e-06, "epoch": 10.428571428571429, "percentage": 29.8, "elapsed_time": "0:19:36", "remaining_time": "0:46:12"}
{"current_steps": 293, "total_steps": 980, "loss": 0.0696, "lr": 8.853020262422111e-06, "epoch": 10.464285714285714, "percentage": 29.9, "elapsed_time": "0:19:39", "remaining_time": "0:46:06"}
{"current_steps": 294, "total_steps": 980, "loss": 0.0803, "lr": 8.84164560866564e-06, "epoch": 10.5, "percentage": 30.0, "elapsed_time": "0:19:43", "remaining_time": "0:46:00"}
{"current_steps": 295, "total_steps": 980, "loss": 0.0984, "lr": 8.83022221559489e-06, "epoch": 10.535714285714286, "percentage": 30.1, "elapsed_time": "0:19:47", "remaining_time": "0:45:56"}
{"current_steps": 296, "total_steps": 980, "loss": 0.0675, "lr": 8.818750228139513e-06, "epoch": 10.571428571428571, "percentage": 30.2, "elapsed_time": "0:19:51", "remaining_time": "0:45:52"}
{"current_steps": 297, "total_steps": 980, "loss": 0.079, "lr": 8.807229791845673e-06, "epoch": 10.607142857142858, "percentage": 30.31, "elapsed_time": "0:19:54", "remaining_time": "0:45:46"}
{"current_steps": 298, "total_steps": 980, "loss": 0.0909, "lr": 8.795661052874217e-06, "epoch": 10.642857142857142, "percentage": 30.41, "elapsed_time": "0:19:57", "remaining_time": "0:45:40"}
{"current_steps": 299, "total_steps": 980, "loss": 0.079, "lr": 8.78404415799881e-06, "epoch": 10.678571428571429, "percentage": 30.51, "elapsed_time": "0:20:01", "remaining_time": "0:45:37"}
{"current_steps": 300, "total_steps": 980, "loss": 0.0978, "lr": 8.772379254604074e-06, "epoch": 10.714285714285714, "percentage": 30.61, "elapsed_time": "0:20:04", "remaining_time": "0:45:31"}
{"current_steps": 300, "total_steps": 980, "eval_loss": 2.0024502277374268, "epoch": 10.714285714285714, "percentage": 30.61, "elapsed_time": "0:20:05", "remaining_time": "0:45:32"}
{"current_steps": 301, "total_steps": 980, "loss": 0.0926, "lr": 8.76066649068372e-06, "epoch": 10.75, "percentage": 30.71, "elapsed_time": "0:20:54", "remaining_time": "0:47:10"}
{"current_steps": 302, "total_steps": 980, "loss": 0.0895, "lr": 8.748906014838672e-06, "epoch": 10.785714285714286, "percentage": 30.82, "elapsed_time": "0:20:58", "remaining_time": "0:47:04"}
{"current_steps": 303, "total_steps": 980, "loss": 0.0765, "lr": 8.737097976275177e-06, "epoch": 10.821428571428571, "percentage": 30.92, "elapsed_time": "0:21:01", "remaining_time": "0:46:59"}
{"current_steps": 304, "total_steps": 980, "loss": 0.081, "lr": 8.725242524802919e-06, "epoch": 10.857142857142858, "percentage": 31.02, "elapsed_time": "0:21:05", "remaining_time": "0:46:53"}
{"current_steps": 305, "total_steps": 980, "loss": 0.0714, "lr": 8.713339810833105e-06, "epoch": 10.892857142857142, "percentage": 31.12, "elapsed_time": "0:21:08", "remaining_time": "0:46:47"}
{"current_steps": 306, "total_steps": 980, "loss": 0.0826, "lr": 8.701389985376578e-06, "epoch": 10.928571428571429, "percentage": 31.22, "elapsed_time": "0:21:12", "remaining_time": "0:46:42"}
{"current_steps": 307, "total_steps": 980, "loss": 0.0914, "lr": 8.689393200041878e-06, "epoch": 10.964285714285714, "percentage": 31.33, "elapsed_time": "0:21:15", "remaining_time": "0:46:35"}
{"current_steps": 308, "total_steps": 980, "loss": 0.0473, "lr": 8.677349607033336e-06, "epoch": 11.0, "percentage": 31.43, "elapsed_time": "0:21:19", "remaining_time": "0:46:31"}
{"current_steps": 309, "total_steps": 980, "loss": 0.0461, "lr": 8.665259359149132e-06, "epoch": 11.035714285714286, "percentage": 31.53, "elapsed_time": "0:21:23", "remaining_time": "0:46:27"}
{"current_steps": 310, "total_steps": 980, "loss": 0.0506, "lr": 8.653122609779365e-06, "epoch": 11.071428571428571, "percentage": 31.63, "elapsed_time": "0:21:26", "remaining_time": "0:46:21"}
{"current_steps": 311, "total_steps": 980, "loss": 0.044, "lr": 8.640939512904097e-06, "epoch": 11.107142857142858, "percentage": 31.73, "elapsed_time": "0:21:31", "remaining_time": "0:46:17"}
{"current_steps": 312, "total_steps": 980, "loss": 0.0442, "lr": 8.62871022309141e-06, "epoch": 11.142857142857142, "percentage": 31.84, "elapsed_time": "0:21:34", "remaining_time": "0:46:12"}
{"current_steps": 313, "total_steps": 980, "loss": 0.0356, "lr": 8.61643489549544e-06, "epoch": 11.178571428571429, "percentage": 31.94, "elapsed_time": "0:21:37", "remaining_time": "0:46:06"}
{"current_steps": 314, "total_steps": 980, "loss": 0.0465, "lr": 8.604113685854407e-06, "epoch": 11.214285714285714, "percentage": 32.04, "elapsed_time": "0:21:41", "remaining_time": "0:46:01"}
{"current_steps": 315, "total_steps": 980, "loss": 0.0485, "lr": 8.591746750488639e-06, "epoch": 11.25, "percentage": 32.14, "elapsed_time": "0:21:45", "remaining_time": "0:45:56"}
{"current_steps": 316, "total_steps": 980, "loss": 0.0623, "lr": 8.579334246298593e-06, "epoch": 11.285714285714286, "percentage": 32.24, "elapsed_time": "0:21:48", "remaining_time": "0:45:50"}
{"current_steps": 317, "total_steps": 980, "loss": 0.0485, "lr": 8.566876330762861e-06, "epoch": 11.321428571428571, "percentage": 32.35, "elapsed_time": "0:21:52", "remaining_time": "0:45:44"}
{"current_steps": 318, "total_steps": 980, "loss": 0.0549, "lr": 8.554373161936176e-06, "epoch": 11.357142857142858, "percentage": 32.45, "elapsed_time": "0:21:56", "remaining_time": "0:45:40"}
{"current_steps": 319, "total_steps": 980, "loss": 0.0419, "lr": 8.541824898447399e-06, "epoch": 11.392857142857142, "percentage": 32.55, "elapsed_time": "0:22:00", "remaining_time": "0:45:35"}
{"current_steps": 320, "total_steps": 980, "loss": 0.0538, "lr": 8.529231699497512e-06, "epoch": 11.428571428571429, "percentage": 32.65, "elapsed_time": "0:22:04", "remaining_time": "0:45:31"}
{"current_steps": 321, "total_steps": 980, "loss": 0.0476, "lr": 8.516593724857598e-06, "epoch": 11.464285714285714, "percentage": 32.76, "elapsed_time": "0:22:07", "remaining_time": "0:45:25"}
{"current_steps": 322, "total_steps": 980, "loss": 0.048, "lr": 8.503911134866819e-06, "epoch": 11.5, "percentage": 32.86, "elapsed_time": "0:22:11", "remaining_time": "0:45:21"}
{"current_steps": 323, "total_steps": 980, "loss": 0.052, "lr": 8.491184090430365e-06, "epoch": 11.535714285714286, "percentage": 32.96, "elapsed_time": "0:22:14", "remaining_time": "0:45:15"}
{"current_steps": 324, "total_steps": 980, "loss": 0.0451, "lr": 8.478412753017433e-06, "epoch": 11.571428571428571, "percentage": 33.06, "elapsed_time": "0:22:19", "remaining_time": "0:45:11"}
{"current_steps": 325, "total_steps": 980, "loss": 0.0511, "lr": 8.465597284659163e-06, "epoch": 11.607142857142858, "percentage": 33.16, "elapsed_time": "0:22:22", "remaining_time": "0:45:05"}
{"current_steps": 326, "total_steps": 980, "loss": 0.0612, "lr": 8.452737847946597e-06, "epoch": 11.642857142857142, "percentage": 33.27, "elapsed_time": "0:22:25", "remaining_time": "0:44:59"}
{"current_steps": 327, "total_steps": 980, "loss": 0.0663, "lr": 8.439834606028594e-06, "epoch": 11.678571428571429, "percentage": 33.37, "elapsed_time": "0:22:29", "remaining_time": "0:44:55"}
{"current_steps": 328, "total_steps": 980, "loss": 0.0538, "lr": 8.426887722609787e-06, "epoch": 11.714285714285714, "percentage": 33.47, "elapsed_time": "0:22:33", "remaining_time": "0:44:49"}
{"current_steps": 329, "total_steps": 980, "loss": 0.059, "lr": 8.413897361948484e-06, "epoch": 11.75, "percentage": 33.57, "elapsed_time": "0:22:36", "remaining_time": "0:44:43"}
{"current_steps": 330, "total_steps": 980, "loss": 0.0597, "lr": 8.400863688854598e-06, "epoch": 11.785714285714286, "percentage": 33.67, "elapsed_time": "0:22:39", "remaining_time": "0:44:38"}
{"current_steps": 331, "total_steps": 980, "loss": 0.0445, "lr": 8.387786868687549e-06, "epoch": 11.821428571428571, "percentage": 33.78, "elapsed_time": "0:22:43", "remaining_time": "0:44:34"}
{"current_steps": 332, "total_steps": 980, "loss": 0.0616, "lr": 8.374667067354164e-06, "epoch": 11.857142857142858, "percentage": 33.88, "elapsed_time": "0:22:47", "remaining_time": "0:44:28"}
{"current_steps": 333, "total_steps": 980, "loss": 0.0467, "lr": 8.361504451306585e-06, "epoch": 11.892857142857142, "percentage": 33.98, "elapsed_time": "0:22:50", "remaining_time": "0:44:23"}
{"current_steps": 334, "total_steps": 980, "loss": 0.0685, "lr": 8.34829918754014e-06, "epoch": 11.928571428571429, "percentage": 34.08, "elapsed_time": "0:22:54", "remaining_time": "0:44:17"}
{"current_steps": 335, "total_steps": 980, "loss": 0.0503, "lr": 8.335051443591236e-06, "epoch": 11.964285714285714, "percentage": 34.18, "elapsed_time": "0:22:58", "remaining_time": "0:44:13"}
{"current_steps": 336, "total_steps": 980, "loss": 0.0429, "lr": 8.321761387535231e-06, "epoch": 12.0, "percentage": 34.29, "elapsed_time": "0:23:02", "remaining_time": "0:44:10"}
{"current_steps": 337, "total_steps": 980, "loss": 0.033, "lr": 8.308429187984298e-06, "epoch": 12.035714285714286, "percentage": 34.39, "elapsed_time": "0:23:06", "remaining_time": "0:44:06"}
{"current_steps": 338, "total_steps": 980, "loss": 0.0379, "lr": 8.295055014085289e-06, "epoch": 12.071428571428571, "percentage": 34.49, "elapsed_time": "0:23:11", "remaining_time": "0:44:02"}
{"current_steps": 339, "total_steps": 980, "loss": 0.0423, "lr": 8.281639035517591e-06, "epoch": 12.107142857142858, "percentage": 34.59, "elapsed_time": "0:23:14", "remaining_time": "0:43:57"}
{"current_steps": 340, "total_steps": 980, "loss": 0.0284, "lr": 8.268181422490969e-06, "epoch": 12.142857142857142, "percentage": 34.69, "elapsed_time": "0:23:18", "remaining_time": "0:43:52"}
{"current_steps": 341, "total_steps": 980, "loss": 0.0302, "lr": 8.254682345743406e-06, "epoch": 12.178571428571429, "percentage": 34.8, "elapsed_time": "0:23:21", "remaining_time": "0:43:46"}
{"current_steps": 342, "total_steps": 980, "loss": 0.0341, "lr": 8.241141976538944e-06, "epoch": 12.214285714285714, "percentage": 34.9, "elapsed_time": "0:23:25", "remaining_time": "0:43:41"}
{"current_steps": 343, "total_steps": 980, "loss": 0.025, "lr": 8.227560486665498e-06, "epoch": 12.25, "percentage": 35.0, "elapsed_time": "0:23:28", "remaining_time": "0:43:35"}
{"current_steps": 344, "total_steps": 980, "loss": 0.0273, "lr": 8.213938048432697e-06, "epoch": 12.285714285714286, "percentage": 35.1, "elapsed_time": "0:23:31", "remaining_time": "0:43:30"}
{"current_steps": 345, "total_steps": 980, "loss": 0.0299, "lr": 8.200274834669675e-06, "epoch": 12.321428571428571, "percentage": 35.2, "elapsed_time": "0:23:35", "remaining_time": "0:43:26"}
{"current_steps": 346, "total_steps": 980, "loss": 0.0278, "lr": 8.186571018722894e-06, "epoch": 12.357142857142858, "percentage": 35.31, "elapsed_time": "0:23:39", "remaining_time": "0:43:20"}
{"current_steps": 347, "total_steps": 980, "loss": 0.037, "lr": 8.172826774453937e-06, "epoch": 12.392857142857142, "percentage": 35.41, "elapsed_time": "0:23:42", "remaining_time": "0:43:15"}
{"current_steps": 348, "total_steps": 980, "loss": 0.0457, "lr": 8.159042276237308e-06, "epoch": 12.428571428571429, "percentage": 35.51, "elapsed_time": "0:23:45", "remaining_time": "0:43:09"}
{"current_steps": 349, "total_steps": 980, "loss": 0.0334, "lr": 8.145217698958213e-06, "epoch": 12.464285714285714, "percentage": 35.61, "elapsed_time": "0:23:50", "remaining_time": "0:43:05"}
{"current_steps": 350, "total_steps": 980, "loss": 0.0381, "lr": 8.131353218010347e-06, "epoch": 12.5, "percentage": 35.71, "elapsed_time": "0:23:53", "remaining_time": "0:43:00"}
{"current_steps": 351, "total_steps": 980, "loss": 0.0331, "lr": 8.117449009293668e-06, "epoch": 12.535714285714286, "percentage": 35.82, "elapsed_time": "0:23:56", "remaining_time": "0:42:54"}
{"current_steps": 352, "total_steps": 980, "loss": 0.0379, "lr": 8.10350524921216e-06, "epoch": 12.571428571428571, "percentage": 35.92, "elapsed_time": "0:24:00", "remaining_time": "0:42:50"}
{"current_steps": 353, "total_steps": 980, "loss": 0.0349, "lr": 8.089522114671603e-06, "epoch": 12.607142857142858, "percentage": 36.02, "elapsed_time": "0:24:04", "remaining_time": "0:42:44"}
{"current_steps": 354, "total_steps": 980, "loss": 0.0354, "lr": 8.075499783077321e-06, "epoch": 12.642857142857142, "percentage": 36.12, "elapsed_time": "0:24:07", "remaining_time": "0:42:40"}
{"current_steps": 355, "total_steps": 980, "loss": 0.0358, "lr": 8.061438432331935e-06, "epoch": 12.678571428571429, "percentage": 36.22, "elapsed_time": "0:24:11", "remaining_time": "0:42:34"}
{"current_steps": 356, "total_steps": 980, "loss": 0.0485, "lr": 8.047338240833108e-06, "epoch": 12.714285714285714, "percentage": 36.33, "elapsed_time": "0:24:15", "remaining_time": "0:42:30"}
{"current_steps": 357, "total_steps": 980, "loss": 0.04, "lr": 8.033199387471278e-06, "epoch": 12.75, "percentage": 36.43, "elapsed_time": "0:24:18", "remaining_time": "0:42:25"}
{"current_steps": 358, "total_steps": 980, "loss": 0.0285, "lr": 8.019022051627387e-06, "epoch": 12.785714285714286, "percentage": 36.53, "elapsed_time": "0:24:22", "remaining_time": "0:42:21"}
{"current_steps": 359, "total_steps": 980, "loss": 0.0356, "lr": 8.004806413170613e-06, "epoch": 12.821428571428571, "percentage": 36.63, "elapsed_time": "0:24:26", "remaining_time": "0:42:16"}
{"current_steps": 360, "total_steps": 980, "loss": 0.0436, "lr": 7.99055265245608e-06, "epoch": 12.857142857142858, "percentage": 36.73, "elapsed_time": "0:24:29", "remaining_time": "0:42:11"}
{"current_steps": 361, "total_steps": 980, "loss": 0.0434, "lr": 7.976260950322572e-06, "epoch": 12.892857142857142, "percentage": 36.84, "elapsed_time": "0:24:33", "remaining_time": "0:42:06"}
{"current_steps": 362, "total_steps": 980, "loss": 0.0451, "lr": 7.96193148809024e-06, "epoch": 12.928571428571429, "percentage": 36.94, "elapsed_time": "0:24:36", "remaining_time": "0:42:00"}
{"current_steps": 363, "total_steps": 980, "loss": 0.0291, "lr": 7.9475644475583e-06, "epoch": 12.964285714285714, "percentage": 37.04, "elapsed_time": "0:24:39", "remaining_time": "0:41:55"}
{"current_steps": 364, "total_steps": 980, "loss": 0.0277, "lr": 7.933160011002729e-06, "epoch": 13.0, "percentage": 37.14, "elapsed_time": "0:24:43", "remaining_time": "0:41:51"}
{"current_steps": 365, "total_steps": 980, "loss": 0.02, "lr": 7.918718361173951e-06, "epoch": 13.035714285714286, "percentage": 37.24, "elapsed_time": "0:24:47", "remaining_time": "0:41:45"}
{"current_steps": 366, "total_steps": 980, "loss": 0.0185, "lr": 7.904239681294515e-06, "epoch": 13.071428571428571, "percentage": 37.35, "elapsed_time": "0:24:50", "remaining_time": "0:41:40"}
{"current_steps": 367, "total_steps": 980, "loss": 0.0195, "lr": 7.889724155056776e-06, "epoch": 13.107142857142858, "percentage": 37.45, "elapsed_time": "0:24:54", "remaining_time": "0:41:36"}
{"current_steps": 368, "total_steps": 980, "loss": 0.0266, "lr": 7.875171966620567e-06, "epoch": 13.142857142857142, "percentage": 37.55, "elapsed_time": "0:24:58", "remaining_time": "0:41:32"}
{"current_steps": 369, "total_steps": 980, "loss": 0.0193, "lr": 7.860583300610849e-06, "epoch": 13.178571428571429, "percentage": 37.65, "elapsed_time": "0:25:02", "remaining_time": "0:41:28"}
{"current_steps": 370, "total_steps": 980, "loss": 0.0213, "lr": 7.84595834211538e-06, "epoch": 13.214285714285714, "percentage": 37.76, "elapsed_time": "0:25:06", "remaining_time": "0:41:23"}
{"current_steps": 371, "total_steps": 980, "loss": 0.0235, "lr": 7.83129727668237e-06, "epoch": 13.25, "percentage": 37.86, "elapsed_time": "0:25:10", "remaining_time": "0:41:19"}
{"current_steps": 372, "total_steps": 980, "loss": 0.0254, "lr": 7.81660029031811e-06, "epoch": 13.285714285714286, "percentage": 37.96, "elapsed_time": "0:25:13", "remaining_time": "0:41:14"}
{"current_steps": 373, "total_steps": 980, "loss": 0.0255, "lr": 7.801867569484635e-06, "epoch": 13.321428571428571, "percentage": 38.06, "elapsed_time": "0:25:16", "remaining_time": "0:41:08"}
{"current_steps": 374, "total_steps": 980, "loss": 0.0277, "lr": 7.78709930109734e-06, "epoch": 13.357142857142858, "percentage": 38.16, "elapsed_time": "0:25:20", "remaining_time": "0:41:03"}
{"current_steps": 375, "total_steps": 980, "loss": 0.0285, "lr": 7.772295672522615e-06, "epoch": 13.392857142857142, "percentage": 38.27, "elapsed_time": "0:25:24", "remaining_time": "0:40:59"}
{"current_steps": 376, "total_steps": 980, "loss": 0.0236, "lr": 7.75745687157547e-06, "epoch": 13.428571428571429, "percentage": 38.37, "elapsed_time": "0:25:28", "remaining_time": "0:40:55"}
{"current_steps": 377, "total_steps": 980, "loss": 0.0184, "lr": 7.742583086517151e-06, "epoch": 13.464285714285714, "percentage": 38.47, "elapsed_time": "0:25:32", "remaining_time": "0:40:51"}
{"current_steps": 378, "total_steps": 980, "loss": 0.026, "lr": 7.727674506052744e-06, "epoch": 13.5, "percentage": 38.57, "elapsed_time": "0:25:36", "remaining_time": "0:40:47"}
{"current_steps": 379, "total_steps": 980, "loss": 0.0251, "lr": 7.712731319328798e-06, "epoch": 13.535714285714286, "percentage": 38.67, "elapsed_time": "0:25:39", "remaining_time": "0:40:41"}
{"current_steps": 380, "total_steps": 980, "loss": 0.0224, "lr": 7.697753715930906e-06, "epoch": 13.571428571428571, "percentage": 38.78, "elapsed_time": "0:25:43", "remaining_time": "0:40:36"}
{"current_steps": 381, "total_steps": 980, "loss": 0.0261, "lr": 7.682741885881314e-06, "epoch": 13.607142857142858, "percentage": 38.88, "elapsed_time": "0:25:47", "remaining_time": "0:40:32"}
{"current_steps": 382, "total_steps": 980, "loss": 0.0418, "lr": 7.667696019636504e-06, "epoch": 13.642857142857142, "percentage": 38.98, "elapsed_time": "0:25:50", "remaining_time": "0:40:26"}
{"current_steps": 383, "total_steps": 980, "loss": 0.0296, "lr": 7.652616308084774e-06, "epoch": 13.678571428571429, "percentage": 39.08, "elapsed_time": "0:25:53", "remaining_time": "0:40:21"}
{"current_steps": 384, "total_steps": 980, "loss": 0.0345, "lr": 7.637502942543825e-06, "epoch": 13.714285714285714, "percentage": 39.18, "elapsed_time": "0:25:57", "remaining_time": "0:40:17"}
{"current_steps": 385, "total_steps": 980, "loss": 0.0374, "lr": 7.622356114758328e-06, "epoch": 13.75, "percentage": 39.29, "elapsed_time": "0:26:01", "remaining_time": "0:40:13"}
{"current_steps": 386, "total_steps": 980, "loss": 0.0335, "lr": 7.607176016897491e-06, "epoch": 13.785714285714286, "percentage": 39.39, "elapsed_time": "0:26:05", "remaining_time": "0:40:09"}
{"current_steps": 387, "total_steps": 980, "loss": 0.0312, "lr": 7.591962841552627e-06, "epoch": 13.821428571428571, "percentage": 39.49, "elapsed_time": "0:26:08", "remaining_time": "0:40:04"}
{"current_steps": 388, "total_steps": 980, "loss": 0.0306, "lr": 7.576716781734699e-06, "epoch": 13.857142857142858, "percentage": 39.59, "elapsed_time": "0:26:12", "remaining_time": "0:39:58"}
{"current_steps": 389, "total_steps": 980, "loss": 0.0248, "lr": 7.561438030871886e-06, "epoch": 13.892857142857142, "percentage": 39.69, "elapsed_time": "0:26:16", "remaining_time": "0:39:54"}
{"current_steps": 390, "total_steps": 980, "loss": 0.0243, "lr": 7.546126782807117e-06, "epoch": 13.928571428571429, "percentage": 39.8, "elapsed_time": "0:26:19", "remaining_time": "0:39:49"}
{"current_steps": 391, "total_steps": 980, "loss": 0.0276, "lr": 7.530783231795615e-06, "epoch": 13.964285714285714, "percentage": 39.9, "elapsed_time": "0:26:23", "remaining_time": "0:39:44"}
{"current_steps": 392, "total_steps": 980, "loss": 0.016, "lr": 7.515407572502438e-06, "epoch": 14.0, "percentage": 40.0, "elapsed_time": "0:26:26", "remaining_time": "0:39:39"}
{"current_steps": 393, "total_steps": 980, "loss": 0.0185, "lr": 7.500000000000001e-06, "epoch": 14.035714285714286, "percentage": 40.1, "elapsed_time": "0:26:29", "remaining_time": "0:39:34"}
{"current_steps": 394, "total_steps": 980, "loss": 0.0171, "lr": 7.484560709765605e-06, "epoch": 14.071428571428571, "percentage": 40.2, "elapsed_time": "0:26:33", "remaining_time": "0:39:30"}
{"current_steps": 395, "total_steps": 980, "loss": 0.0227, "lr": 7.469089897678958e-06, "epoch": 14.107142857142858, "percentage": 40.31, "elapsed_time": "0:26:37", "remaining_time": "0:39:25"}
{"current_steps": 396, "total_steps": 980, "loss": 0.0308, "lr": 7.453587760019691e-06, "epoch": 14.142857142857142, "percentage": 40.41, "elapsed_time": "0:26:41", "remaining_time": "0:39:22"}
{"current_steps": 397, "total_steps": 980, "loss": 0.016, "lr": 7.438054493464859e-06, "epoch": 14.178571428571429, "percentage": 40.51, "elapsed_time": "0:26:45", "remaining_time": "0:39:17"}
{"current_steps": 398, "total_steps": 980, "loss": 0.0219, "lr": 7.422490295086457e-06, "epoch": 14.214285714285714, "percentage": 40.61, "elapsed_time": "0:26:49", "remaining_time": "0:39:13"}
{"current_steps": 399, "total_steps": 980, "loss": 0.0165, "lr": 7.406895362348916e-06, "epoch": 14.25, "percentage": 40.71, "elapsed_time": "0:26:52", "remaining_time": "0:39:08"}
{"current_steps": 400, "total_steps": 980, "loss": 0.0219, "lr": 7.391269893106592e-06, "epoch": 14.285714285714286, "percentage": 40.82, "elapsed_time": "0:26:56", "remaining_time": "0:39:03"}
{"current_steps": 400, "total_steps": 980, "eval_loss": 2.3083860874176025, "epoch": 14.285714285714286, "percentage": 40.82, "elapsed_time": "0:26:56", "remaining_time": "0:39:04"}
{"current_steps": 401, "total_steps": 980, "loss": 0.0188, "lr": 7.375614085601265e-06, "epoch": 14.321428571428571, "percentage": 40.92, "elapsed_time": "0:27:46", "remaining_time": "0:40:05"}
{"current_steps": 402, "total_steps": 980, "loss": 0.0194, "lr": 7.359928138459615e-06, "epoch": 14.357142857142858, "percentage": 41.02, "elapsed_time": "0:27:50", "remaining_time": "0:40:01"}
{"current_steps": 403, "total_steps": 980, "loss": 0.0195, "lr": 7.344212250690712e-06, "epoch": 14.392857142857142, "percentage": 41.12, "elapsed_time": "0:27:54", "remaining_time": "0:39:56"}
{"current_steps": 404, "total_steps": 980, "loss": 0.0199, "lr": 7.328466621683481e-06, "epoch": 14.428571428571429, "percentage": 41.22, "elapsed_time": "0:27:57", "remaining_time": "0:39:52"}
{"current_steps": 405, "total_steps": 980, "loss": 0.0182, "lr": 7.312691451204178e-06, "epoch": 14.464285714285714, "percentage": 41.33, "elapsed_time": "0:28:01", "remaining_time": "0:39:47"}
{"current_steps": 406, "total_steps": 980, "loss": 0.0241, "lr": 7.296886939393852e-06, "epoch": 14.5, "percentage": 41.43, "elapsed_time": "0:28:05", "remaining_time": "0:39:43"}
{"current_steps": 407, "total_steps": 980, "loss": 0.0154, "lr": 7.281053286765816e-06, "epoch": 14.535714285714286, "percentage": 41.53, "elapsed_time": "0:28:09", "remaining_time": "0:39:38"}
{"current_steps": 408, "total_steps": 980, "loss": 0.0212, "lr": 7.265190694203086e-06, "epoch": 14.571428571428571, "percentage": 41.63, "elapsed_time": "0:28:13", "remaining_time": "0:39:33"}
{"current_steps": 409, "total_steps": 980, "loss": 0.0254, "lr": 7.249299362955846e-06, "epoch": 14.607142857142858, "percentage": 41.73, "elapsed_time": "0:28:16", "remaining_time": "0:39:28"}
{"current_steps": 410, "total_steps": 980, "loss": 0.0216, "lr": 7.233379494638891e-06, "epoch": 14.642857142857142, "percentage": 41.84, "elapsed_time": "0:28:20", "remaining_time": "0:39:23"}
{"current_steps": 411, "total_steps": 980, "loss": 0.0173, "lr": 7.217431291229068e-06, "epoch": 14.678571428571429, "percentage": 41.94, "elapsed_time": "0:28:24", "remaining_time": "0:39:19"}
{"current_steps": 412, "total_steps": 980, "loss": 0.0169, "lr": 7.201454955062712e-06, "epoch": 14.714285714285714, "percentage": 42.04, "elapsed_time": "0:28:27", "remaining_time": "0:39:13"}
{"current_steps": 413, "total_steps": 980, "loss": 0.0229, "lr": 7.185450688833083e-06, "epoch": 14.75, "percentage": 42.14, "elapsed_time": "0:28:30", "remaining_time": "0:39:08"}
{"current_steps": 414, "total_steps": 980, "loss": 0.0196, "lr": 7.169418695587791e-06, "epoch": 14.785714285714286, "percentage": 42.24, "elapsed_time": "0:28:34", "remaining_time": "0:39:04"}
{"current_steps": 415, "total_steps": 980, "loss": 0.0239, "lr": 7.153359178726222e-06, "epoch": 14.821428571428571, "percentage": 42.35, "elapsed_time": "0:28:37", "remaining_time": "0:38:58"}
{"current_steps": 416, "total_steps": 980, "loss": 0.0241, "lr": 7.137272341996958e-06, "epoch": 14.857142857142858, "percentage": 42.45, "elapsed_time": "0:28:41", "remaining_time": "0:38:54"}
{"current_steps": 417, "total_steps": 980, "loss": 0.0232, "lr": 7.121158389495187e-06, "epoch": 14.892857142857142, "percentage": 42.55, "elapsed_time": "0:28:45", "remaining_time": "0:38:49"}
{"current_steps": 418, "total_steps": 980, "loss": 0.0225, "lr": 7.10501752566012e-06, "epoch": 14.928571428571429, "percentage": 42.65, "elapsed_time": "0:28:48", "remaining_time": "0:38:44"}
{"current_steps": 419, "total_steps": 980, "loss": 0.0246, "lr": 7.088849955272396e-06, "epoch": 14.964285714285714, "percentage": 42.76, "elapsed_time": "0:28:52", "remaining_time": "0:38:40"}
{"current_steps": 420, "total_steps": 980, "loss": 0.0183, "lr": 7.072655883451478e-06, "epoch": 15.0, "percentage": 42.86, "elapsed_time": "0:28:56", "remaining_time": "0:38:34"}
{"current_steps": 421, "total_steps": 980, "loss": 0.0147, "lr": 7.056435515653059e-06, "epoch": 15.035714285714286, "percentage": 42.96, "elapsed_time": "0:28:59", "remaining_time": "0:38:30"}
{"current_steps": 422, "total_steps": 980, "loss": 0.0162, "lr": 7.040189057666449e-06, "epoch": 15.071428571428571, "percentage": 43.06, "elapsed_time": "0:29:03", "remaining_time": "0:38:25"}
{"current_steps": 423, "total_steps": 980, "loss": 0.0152, "lr": 7.023916715611969e-06, "epoch": 15.107142857142858, "percentage": 43.16, "elapsed_time": "0:29:06", "remaining_time": "0:38:20"}
{"current_steps": 424, "total_steps": 980, "loss": 0.0126, "lr": 7.007618695938334e-06, "epoch": 15.142857142857142, "percentage": 43.27, "elapsed_time": "0:29:10", "remaining_time": "0:38:15"}
{"current_steps": 425, "total_steps": 980, "loss": 0.0133, "lr": 6.991295205420028e-06, "epoch": 15.178571428571429, "percentage": 43.37, "elapsed_time": "0:29:14", "remaining_time": "0:38:11"}
{"current_steps": 426, "total_steps": 980, "loss": 0.0134, "lr": 6.974946451154694e-06, "epoch": 15.214285714285714, "percentage": 43.47, "elapsed_time": "0:29:17", "remaining_time": "0:38:06"}
{"current_steps": 427, "total_steps": 980, "loss": 0.0159, "lr": 6.9585726405604915e-06, "epoch": 15.25, "percentage": 43.57, "elapsed_time": "0:29:21", "remaining_time": "0:38:00"}
{"current_steps": 428, "total_steps": 980, "loss": 0.0141, "lr": 6.942173981373474e-06, "epoch": 15.285714285714286, "percentage": 43.67, "elapsed_time": "0:29:24", "remaining_time": "0:37:55"}
{"current_steps": 429, "total_steps": 980, "loss": 0.0145, "lr": 6.925750681644954e-06, "epoch": 15.321428571428571, "percentage": 43.78, "elapsed_time": "0:29:28", "remaining_time": "0:37:51"}
{"current_steps": 430, "total_steps": 980, "loss": 0.0158, "lr": 6.90930294973886e-06, "epoch": 15.357142857142858, "percentage": 43.88, "elapsed_time": "0:29:32", "remaining_time": "0:37:47"}
{"current_steps": 431, "total_steps": 980, "loss": 0.0187, "lr": 6.892830994329089e-06, "epoch": 15.392857142857142, "percentage": 43.98, "elapsed_time": "0:29:36", "remaining_time": "0:37:43"}
{"current_steps": 432, "total_steps": 980, "loss": 0.0141, "lr": 6.876335024396872e-06, "epoch": 15.428571428571429, "percentage": 44.08, "elapsed_time": "0:29:39", "remaining_time": "0:37:37"}
{"current_steps": 433, "total_steps": 980, "loss": 0.0206, "lr": 6.859815249228106e-06, "epoch": 15.464285714285714, "percentage": 44.18, "elapsed_time": "0:29:43", "remaining_time": "0:37:32"}
{"current_steps": 434, "total_steps": 980, "loss": 0.0145, "lr": 6.8432718784107145e-06, "epoch": 15.5, "percentage": 44.29, "elapsed_time": "0:29:47", "remaining_time": "0:37:28"}
{"current_steps": 435, "total_steps": 980, "loss": 0.0168, "lr": 6.8267051218319766e-06, "epoch": 15.535714285714286, "percentage": 44.39, "elapsed_time": "0:29:50", "remaining_time": "0:37:23"}
{"current_steps": 436, "total_steps": 980, "loss": 0.0184, "lr": 6.81011518967587e-06, "epoch": 15.571428571428571, "percentage": 44.49, "elapsed_time": "0:29:53", "remaining_time": "0:37:17"}
{"current_steps": 437, "total_steps": 980, "loss": 0.0191, "lr": 6.793502292420402e-06, "epoch": 15.607142857142858, "percentage": 44.59, "elapsed_time": "0:29:56", "remaining_time": "0:37:12"}
{"current_steps": 438, "total_steps": 980, "loss": 0.0118, "lr": 6.7768666408349445e-06, "epoch": 15.642857142857142, "percentage": 44.69, "elapsed_time": "0:30:00", "remaining_time": "0:37:07"}
{"current_steps": 439, "total_steps": 980, "loss": 0.0201, "lr": 6.760208445977551e-06, "epoch": 15.678571428571429, "percentage": 44.8, "elapsed_time": "0:30:03", "remaining_time": "0:37:02"}
{"current_steps": 440, "total_steps": 980, "loss": 0.0183, "lr": 6.743527919192285e-06, "epoch": 15.714285714285714, "percentage": 44.9, "elapsed_time": "0:30:07", "remaining_time": "0:36:58"}
{"current_steps": 441, "total_steps": 980, "loss": 0.0172, "lr": 6.726825272106539e-06, "epoch": 15.75, "percentage": 45.0, "elapsed_time": "0:30:11", "remaining_time": "0:36:53"}
{"current_steps": 442, "total_steps": 980, "loss": 0.0202, "lr": 6.710100716628345e-06, "epoch": 15.785714285714286, "percentage": 45.1, "elapsed_time": "0:30:15", "remaining_time": "0:36:49"}
{"current_steps": 443, "total_steps": 980, "loss": 0.0175, "lr": 6.693354464943689e-06, "epoch": 15.821428571428571, "percentage": 45.2, "elapsed_time": "0:30:19", "remaining_time": "0:36:45"}
{"current_steps": 444, "total_steps": 980, "loss": 0.0205, "lr": 6.676586729513823e-06, "epoch": 15.857142857142858, "percentage": 45.31, "elapsed_time": "0:30:22", "remaining_time": "0:36:40"}
{"current_steps": 445, "total_steps": 980, "loss": 0.0206, "lr": 6.659797723072558e-06, "epoch": 15.892857142857142, "percentage": 45.41, "elapsed_time": "0:30:27", "remaining_time": "0:36:36"}
{"current_steps": 446, "total_steps": 980, "loss": 0.0207, "lr": 6.642987658623581e-06, "epoch": 15.928571428571429, "percentage": 45.51, "elapsed_time": "0:30:30", "remaining_time": "0:36:31"}
{"current_steps": 447, "total_steps": 980, "loss": 0.0216, "lr": 6.626156749437736e-06, "epoch": 15.964285714285714, "percentage": 45.61, "elapsed_time": "0:30:33", "remaining_time": "0:36:26"}
{"current_steps": 448, "total_steps": 980, "loss": 0.0178, "lr": 6.609305209050332e-06, "epoch": 16.0, "percentage": 45.71, "elapsed_time": "0:30:37", "remaining_time": "0:36:22"}
{"current_steps": 449, "total_steps": 980, "loss": 0.0132, "lr": 6.592433251258423e-06, "epoch": 16.035714285714285, "percentage": 45.82, "elapsed_time": "0:30:40", "remaining_time": "0:36:17"}
{"current_steps": 450, "total_steps": 980, "loss": 0.0142, "lr": 6.575541090118105e-06, "epoch": 16.071428571428573, "percentage": 45.92, "elapsed_time": "0:30:44", "remaining_time": "0:36:12"}
{"current_steps": 451, "total_steps": 980, "loss": 0.0139, "lr": 6.558628939941792e-06, "epoch": 16.107142857142858, "percentage": 46.02, "elapsed_time": "0:30:47", "remaining_time": "0:36:07"}
{"current_steps": 452, "total_steps": 980, "loss": 0.0147, "lr": 6.541697015295503e-06, "epoch": 16.142857142857142, "percentage": 46.12, "elapsed_time": "0:30:51", "remaining_time": "0:36:02"}
{"current_steps": 453, "total_steps": 980, "loss": 0.0112, "lr": 6.524745530996137e-06, "epoch": 16.178571428571427, "percentage": 46.22, "elapsed_time": "0:30:54", "remaining_time": "0:35:57"}
{"current_steps": 454, "total_steps": 980, "loss": 0.0138, "lr": 6.507774702108748e-06, "epoch": 16.214285714285715, "percentage": 46.33, "elapsed_time": "0:30:58", "remaining_time": "0:35:53"}
{"current_steps": 455, "total_steps": 980, "loss": 0.0111, "lr": 6.490784743943819e-06, "epoch": 16.25, "percentage": 46.43, "elapsed_time": "0:31:02", "remaining_time": "0:35:48"}
{"current_steps": 456, "total_steps": 980, "loss": 0.0149, "lr": 6.473775872054522e-06, "epoch": 16.285714285714285, "percentage": 46.53, "elapsed_time": "0:31:05", "remaining_time": "0:35:43"}
{"current_steps": 457, "total_steps": 980, "loss": 0.0134, "lr": 6.456748302233995e-06, "epoch": 16.321428571428573, "percentage": 46.63, "elapsed_time": "0:31:09", "remaining_time": "0:35:39"}
{"current_steps": 458, "total_steps": 980, "loss": 0.0153, "lr": 6.439702250512596e-06, "epoch": 16.357142857142858, "percentage": 46.73, "elapsed_time": "0:31:13", "remaining_time": "0:35:35"}
{"current_steps": 459, "total_steps": 980, "loss": 0.0133, "lr": 6.4226379331551625e-06, "epoch": 16.392857142857142, "percentage": 46.84, "elapsed_time": "0:31:17", "remaining_time": "0:35:31"}
{"current_steps": 460, "total_steps": 980, "loss": 0.0172, "lr": 6.405555566658276e-06, "epoch": 16.428571428571427, "percentage": 46.94, "elapsed_time": "0:31:21", "remaining_time": "0:35:26"}
{"current_steps": 461, "total_steps": 980, "loss": 0.013, "lr": 6.388455367747503e-06, "epoch": 16.464285714285715, "percentage": 47.04, "elapsed_time": "0:31:24", "remaining_time": "0:35:22"}
{"current_steps": 462, "total_steps": 980, "loss": 0.0133, "lr": 6.3713375533746525e-06, "epoch": 16.5, "percentage": 47.14, "elapsed_time": "0:31:28", "remaining_time": "0:35:17"}
{"current_steps": 463, "total_steps": 980, "loss": 0.0143, "lr": 6.354202340715027e-06, "epoch": 16.535714285714285, "percentage": 47.24, "elapsed_time": "0:31:32", "remaining_time": "0:35:13"}
{"current_steps": 464, "total_steps": 980, "loss": 0.0153, "lr": 6.337049947164656e-06, "epoch": 16.571428571428573, "percentage": 47.35, "elapsed_time": "0:31:36", "remaining_time": "0:35:09"}
{"current_steps": 465, "total_steps": 980, "loss": 0.0173, "lr": 6.319880590337549e-06, "epoch": 16.607142857142858, "percentage": 47.45, "elapsed_time": "0:31:40", "remaining_time": "0:35:05"}
{"current_steps": 466, "total_steps": 980, "loss": 0.0185, "lr": 6.302694488062931e-06, "epoch": 16.642857142857142, "percentage": 47.55, "elapsed_time": "0:31:43", "remaining_time": "0:35:00"}
{"current_steps": 467, "total_steps": 980, "loss": 0.014, "lr": 6.2854918583824745e-06, "epoch": 16.678571428571427, "percentage": 47.65, "elapsed_time": "0:31:47", "remaining_time": "0:34:55"}
{"current_steps": 468, "total_steps": 980, "loss": 0.0172, "lr": 6.268272919547537e-06, "epoch": 16.714285714285715, "percentage": 47.76, "elapsed_time": "0:31:51", "remaining_time": "0:34:50"}
{"current_steps": 469, "total_steps": 980, "loss": 0.0128, "lr": 6.251037890016396e-06, "epoch": 16.75, "percentage": 47.86, "elapsed_time": "0:31:54", "remaining_time": "0:34:45"}
{"current_steps": 470, "total_steps": 980, "loss": 0.0148, "lr": 6.233786988451468e-06, "epoch": 16.785714285714285, "percentage": 47.96, "elapsed_time": "0:31:58", "remaining_time": "0:34:41"}
{"current_steps": 471, "total_steps": 980, "loss": 0.0188, "lr": 6.216520433716544e-06, "epoch": 16.821428571428573, "percentage": 48.06, "elapsed_time": "0:32:01", "remaining_time": "0:34:37"}
{"current_steps": 472, "total_steps": 980, "loss": 0.0172, "lr": 6.199238444874005e-06, "epoch": 16.857142857142858, "percentage": 48.16, "elapsed_time": "0:32:05", "remaining_time": "0:34:32"}
{"current_steps": 473, "total_steps": 980, "loss": 0.0149, "lr": 6.181941241182044e-06, "epoch": 16.892857142857142, "percentage": 48.27, "elapsed_time": "0:32:08", "remaining_time": "0:34:27"}
{"current_steps": 474, "total_steps": 980, "loss": 0.0159, "lr": 6.164629042091894e-06, "epoch": 16.928571428571427, "percentage": 48.37, "elapsed_time": "0:32:12", "remaining_time": "0:34:23"}
{"current_steps": 475, "total_steps": 980, "loss": 0.0175, "lr": 6.1473020672450275e-06, "epoch": 16.964285714285715, "percentage": 48.47, "elapsed_time": "0:32:17", "remaining_time": "0:34:19"}
{"current_steps": 476, "total_steps": 980, "loss": 0.0137, "lr": 6.1299605364703826e-06, "epoch": 17.0, "percentage": 48.57, "elapsed_time": "0:32:20", "remaining_time": "0:34:14"}
{"current_steps": 477, "total_steps": 980, "loss": 0.0126, "lr": 6.112604669781572e-06, "epoch": 17.035714285714285, "percentage": 48.67, "elapsed_time": "0:32:23", "remaining_time": "0:34:09"}
{"current_steps": 478, "total_steps": 980, "loss": 0.0111, "lr": 6.095234687374085e-06, "epoch": 17.071428571428573, "percentage": 48.78, "elapsed_time": "0:32:27", "remaining_time": "0:34:04"}
{"current_steps": 479, "total_steps": 980, "loss": 0.014, "lr": 6.0778508096224985e-06, "epoch": 17.107142857142858, "percentage": 48.88, "elapsed_time": "0:32:31", "remaining_time": "0:34:00"}
{"current_steps": 480, "total_steps": 980, "loss": 0.011, "lr": 6.060453257077686e-06, "epoch": 17.142857142857142, "percentage": 48.98, "elapsed_time": "0:32:35", "remaining_time": "0:33:56"}
{"current_steps": 481, "total_steps": 980, "loss": 0.0113, "lr": 6.043042250464005e-06, "epoch": 17.178571428571427, "percentage": 49.08, "elapsed_time": "0:32:39", "remaining_time": "0:33:52"}
{"current_steps": 482, "total_steps": 980, "loss": 0.0076, "lr": 6.025618010676516e-06, "epoch": 17.214285714285715, "percentage": 49.18, "elapsed_time": "0:32:42", "remaining_time": "0:33:47"}
{"current_steps": 483, "total_steps": 980, "loss": 0.0116, "lr": 6.008180758778167e-06, "epoch": 17.25, "percentage": 49.29, "elapsed_time": "0:32:45", "remaining_time": "0:33:42"}
{"current_steps": 484, "total_steps": 980, "loss": 0.0152, "lr": 5.990730715996989e-06, "epoch": 17.285714285714285, "percentage": 49.39, "elapsed_time": "0:32:49", "remaining_time": "0:33:37"}
{"current_steps": 485, "total_steps": 980, "loss": 0.0116, "lr": 5.973268103723293e-06, "epoch": 17.321428571428573, "percentage": 49.49, "elapsed_time": "0:32:53", "remaining_time": "0:33:34"}
{"current_steps": 486, "total_steps": 980, "loss": 0.0108, "lr": 5.955793143506863e-06, "epoch": 17.357142857142858, "percentage": 49.59, "elapsed_time": "0:32:56", "remaining_time": "0:33:29"}
{"current_steps": 487, "total_steps": 980, "loss": 0.0094, "lr": 5.938306057054139e-06, "epoch": 17.392857142857142, "percentage": 49.69, "elapsed_time": "0:33:00", "remaining_time": "0:33:24"}
{"current_steps": 488, "total_steps": 980, "loss": 0.0135, "lr": 5.920807066225409e-06, "epoch": 17.428571428571427, "percentage": 49.8, "elapsed_time": "0:33:03", "remaining_time": "0:33:19"}
{"current_steps": 489, "total_steps": 980, "loss": 0.0109, "lr": 5.903296393031996e-06, "epoch": 17.464285714285715, "percentage": 49.9, "elapsed_time": "0:33:07", "remaining_time": "0:33:15"}
{"current_steps": 490, "total_steps": 980, "loss": 0.0151, "lr": 5.885774259633432e-06, "epoch": 17.5, "percentage": 50.0, "elapsed_time": "0:33:10", "remaining_time": "0:33:10"}
{"current_steps": 491, "total_steps": 980, "loss": 0.0104, "lr": 5.8682408883346535e-06, "epoch": 17.535714285714285, "percentage": 50.1, "elapsed_time": "0:33:14", "remaining_time": "0:33:06"}
{"current_steps": 492, "total_steps": 980, "loss": 0.0145, "lr": 5.850696501583164e-06, "epoch": 17.571428571428573, "percentage": 50.2, "elapsed_time": "0:33:17", "remaining_time": "0:33:01"}
{"current_steps": 493, "total_steps": 980, "loss": 0.0153, "lr": 5.8331413219662295e-06, "epoch": 17.607142857142858, "percentage": 50.31, "elapsed_time": "0:33:21", "remaining_time": "0:32:57"}
{"current_steps": 494, "total_steps": 980, "loss": 0.018, "lr": 5.815575572208042e-06, "epoch": 17.642857142857142, "percentage": 50.41, "elapsed_time": "0:33:24", "remaining_time": "0:32:52"}
{"current_steps": 495, "total_steps": 980, "loss": 0.017, "lr": 5.797999475166897e-06, "epoch": 17.678571428571427, "percentage": 50.51, "elapsed_time": "0:33:28", "remaining_time": "0:32:48"}
{"current_steps": 496, "total_steps": 980, "loss": 0.0152, "lr": 5.78041325383237e-06, "epoch": 17.714285714285715, "percentage": 50.61, "elapsed_time": "0:33:32", "remaining_time": "0:32:43"}
{"current_steps": 497, "total_steps": 980, "loss": 0.0143, "lr": 5.762817131322482e-06, "epoch": 17.75, "percentage": 50.71, "elapsed_time": "0:33:36", "remaining_time": "0:32:39"}
{"current_steps": 498, "total_steps": 980, "loss": 0.0153, "lr": 5.745211330880872e-06, "epoch": 17.785714285714285, "percentage": 50.82, "elapsed_time": "0:33:40", "remaining_time": "0:32:35"}
{"current_steps": 499, "total_steps": 980, "loss": 0.014, "lr": 5.7275960758739655e-06, "epoch": 17.821428571428573, "percentage": 50.92, "elapsed_time": "0:33:44", "remaining_time": "0:32:31"}
{"current_steps": 500, "total_steps": 980, "loss": 0.0181, "lr": 5.709971589788136e-06, "epoch": 17.857142857142858, "percentage": 51.02, "elapsed_time": "0:33:47", "remaining_time": "0:32:26"}
{"current_steps": 500, "total_steps": 980, "eval_loss": 2.345672607421875, "epoch": 17.857142857142858, "percentage": 51.02, "elapsed_time": "0:33:48", "remaining_time": "0:32:27"}
{"current_steps": 501, "total_steps": 980, "loss": 0.0181, "lr": 5.69233809622687e-06, "epoch": 17.892857142857142, "percentage": 51.12, "elapsed_time": "0:34:38", "remaining_time": "0:33:07"}
{"current_steps": 502, "total_steps": 980, "loss": 0.0161, "lr": 5.674695818907943e-06, "epoch": 17.928571428571427, "percentage": 51.22, "elapsed_time": "0:34:42", "remaining_time": "0:33:03"}
{"current_steps": 503, "total_steps": 980, "loss": 0.0176, "lr": 5.65704498166056e-06, "epoch": 17.964285714285715, "percentage": 51.33, "elapsed_time": "0:34:46", "remaining_time": "0:32:58"}
{"current_steps": 504, "total_steps": 980, "loss": 0.0129, "lr": 5.6393858084225305e-06, "epoch": 18.0, "percentage": 51.43, "elapsed_time": "0:34:49", "remaining_time": "0:32:53"}
{"current_steps": 505, "total_steps": 980, "loss": 0.0088, "lr": 5.621718523237427e-06, "epoch": 18.035714285714285, "percentage": 51.53, "elapsed_time": "0:34:54", "remaining_time": "0:32:49"}
{"current_steps": 506, "total_steps": 980, "loss": 0.0099, "lr": 5.604043350251733e-06, "epoch": 18.071428571428573, "percentage": 51.63, "elapsed_time": "0:34:57", "remaining_time": "0:32:44"}
{"current_steps": 507, "total_steps": 980, "loss": 0.0117, "lr": 5.586360513712011e-06, "epoch": 18.107142857142858, "percentage": 51.73, "elapsed_time": "0:35:00", "remaining_time": "0:32:39"}
{"current_steps": 508, "total_steps": 980, "loss": 0.009, "lr": 5.568670237962045e-06, "epoch": 18.142857142857142, "percentage": 51.84, "elapsed_time": "0:35:04", "remaining_time": "0:32:35"}
{"current_steps": 509, "total_steps": 980, "loss": 0.0124, "lr": 5.550972747440007e-06, "epoch": 18.178571428571427, "percentage": 51.94, "elapsed_time": "0:35:08", "remaining_time": "0:32:30"}
{"current_steps": 510, "total_steps": 980, "loss": 0.0128, "lr": 5.533268266675601e-06, "epoch": 18.214285714285715, "percentage": 52.04, "elapsed_time": "0:35:12", "remaining_time": "0:32:26"}
{"current_steps": 511, "total_steps": 980, "loss": 0.0078, "lr": 5.515557020287219e-06, "epoch": 18.25, "percentage": 52.14, "elapsed_time": "0:35:15", "remaining_time": "0:32:21"}
{"current_steps": 512, "total_steps": 980, "loss": 0.0119, "lr": 5.497839232979084e-06, "epoch": 18.285714285714285, "percentage": 52.24, "elapsed_time": "0:35:18", "remaining_time": "0:32:16"}
{"current_steps": 513, "total_steps": 980, "loss": 0.0152, "lr": 5.480115129538409e-06, "epoch": 18.321428571428573, "percentage": 52.35, "elapsed_time": "0:35:21", "remaining_time": "0:32:11"}
{"current_steps": 514, "total_steps": 980, "loss": 0.0102, "lr": 5.4623849348325396e-06, "epoch": 18.357142857142858, "percentage": 52.45, "elapsed_time": "0:35:26", "remaining_time": "0:32:07"}
{"current_steps": 515, "total_steps": 980, "loss": 0.0122, "lr": 5.444648873806101e-06, "epoch": 18.392857142857142, "percentage": 52.55, "elapsed_time": "0:35:30", "remaining_time": "0:32:03"}
{"current_steps": 516, "total_steps": 980, "loss": 0.0099, "lr": 5.426907171478143e-06, "epoch": 18.428571428571427, "percentage": 52.65, "elapsed_time": "0:35:34", "remaining_time": "0:31:59"}
{"current_steps": 517, "total_steps": 980, "loss": 0.0133, "lr": 5.409160052939292e-06, "epoch": 18.464285714285715, "percentage": 52.76, "elapsed_time": "0:35:37", "remaining_time": "0:31:54"}
{"current_steps": 518, "total_steps": 980, "loss": 0.0165, "lr": 5.391407743348884e-06, "epoch": 18.5, "percentage": 52.86, "elapsed_time": "0:35:41", "remaining_time": "0:31:49"}
{"current_steps": 519, "total_steps": 980, "loss": 0.0121, "lr": 5.373650467932122e-06, "epoch": 18.535714285714285, "percentage": 52.96, "elapsed_time": "0:35:44", "remaining_time": "0:31:45"}
{"current_steps": 520, "total_steps": 980, "loss": 0.0163, "lr": 5.355888451977204e-06, "epoch": 18.571428571428573, "percentage": 53.06, "elapsed_time": "0:35:48", "remaining_time": "0:31:40"}
{"current_steps": 521, "total_steps": 980, "loss": 0.0141, "lr": 5.3381219208324755e-06, "epoch": 18.607142857142858, "percentage": 53.16, "elapsed_time": "0:35:51", "remaining_time": "0:31:35"}
{"current_steps": 522, "total_steps": 980, "loss": 0.0157, "lr": 5.320351099903565e-06, "epoch": 18.642857142857142, "percentage": 53.27, "elapsed_time": "0:35:56", "remaining_time": "0:31:31"}
{"current_steps": 523, "total_steps": 980, "loss": 0.0136, "lr": 5.302576214650527e-06, "epoch": 18.678571428571427, "percentage": 53.37, "elapsed_time": "0:35:59", "remaining_time": "0:31:27"}
{"current_steps": 524, "total_steps": 980, "loss": 0.0121, "lr": 5.284797490584979e-06, "epoch": 18.714285714285715, "percentage": 53.47, "elapsed_time": "0:36:03", "remaining_time": "0:31:22"}
{"current_steps": 525, "total_steps": 980, "loss": 0.0125, "lr": 5.267015153267246e-06, "epoch": 18.75, "percentage": 53.57, "elapsed_time": "0:36:07", "remaining_time": "0:31:18"}
{"current_steps": 526, "total_steps": 980, "loss": 0.0124, "lr": 5.249229428303486e-06, "epoch": 18.785714285714285, "percentage": 53.67, "elapsed_time": "0:36:11", "remaining_time": "0:31:14"}
{"current_steps": 527, "total_steps": 980, "loss": 0.0197, "lr": 5.231440541342846e-06, "epoch": 18.821428571428573, "percentage": 53.78, "elapsed_time": "0:36:15", "remaining_time": "0:31:09"}
{"current_steps": 528, "total_steps": 980, "loss": 0.0122, "lr": 5.213648718074584e-06, "epoch": 18.857142857142858, "percentage": 53.88, "elapsed_time": "0:36:18", "remaining_time": "0:31:04"}
{"current_steps": 529, "total_steps": 980, "loss": 0.0136, "lr": 5.1958541842252145e-06, "epoch": 18.892857142857142, "percentage": 53.98, "elapsed_time": "0:36:21", "remaining_time": "0:30:59"}
{"current_steps": 530, "total_steps": 980, "loss": 0.0143, "lr": 5.178057165555636e-06, "epoch": 18.928571428571427, "percentage": 54.08, "elapsed_time": "0:36:25", "remaining_time": "0:30:55"}
{"current_steps": 531, "total_steps": 980, "loss": 0.0144, "lr": 5.160257887858278e-06, "epoch": 18.964285714285715, "percentage": 54.18, "elapsed_time": "0:36:28", "remaining_time": "0:30:50"}
{"current_steps": 532, "total_steps": 980, "loss": 0.0104, "lr": 5.142456576954225e-06, "epoch": 19.0, "percentage": 54.29, "elapsed_time": "0:36:32", "remaining_time": "0:30:46"}
{"current_steps": 533, "total_steps": 980, "loss": 0.0082, "lr": 5.1246534586903655e-06, "epoch": 19.035714285714285, "percentage": 54.39, "elapsed_time": "0:36:37", "remaining_time": "0:30:42"}
{"current_steps": 534, "total_steps": 980, "loss": 0.0122, "lr": 5.106848758936508e-06, "epoch": 19.071428571428573, "percentage": 54.49, "elapsed_time": "0:36:40", "remaining_time": "0:30:37"}
{"current_steps": 535, "total_steps": 980, "loss": 0.0101, "lr": 5.089042703582533e-06, "epoch": 19.107142857142858, "percentage": 54.59, "elapsed_time": "0:36:43", "remaining_time": "0:30:32"}
{"current_steps": 536, "total_steps": 980, "loss": 0.0105, "lr": 5.071235518535516e-06, "epoch": 19.142857142857142, "percentage": 54.69, "elapsed_time": "0:36:46", "remaining_time": "0:30:28"}
{"current_steps": 537, "total_steps": 980, "loss": 0.0106, "lr": 5.053427429716867e-06, "epoch": 19.178571428571427, "percentage": 54.8, "elapsed_time": "0:36:50", "remaining_time": "0:30:23"}
{"current_steps": 538, "total_steps": 980, "loss": 0.0076, "lr": 5.0356186630594585e-06, "epoch": 19.214285714285715, "percentage": 54.9, "elapsed_time": "0:36:53", "remaining_time": "0:30:18"}
{"current_steps": 539, "total_steps": 980, "loss": 0.0117, "lr": 5.017809444504768e-06, "epoch": 19.25, "percentage": 55.0, "elapsed_time": "0:36:57", "remaining_time": "0:30:14"}
{"current_steps": 540, "total_steps": 980, "loss": 0.012, "lr": 5e-06, "epoch": 19.285714285714285, "percentage": 55.1, "elapsed_time": "0:37:01", "remaining_time": "0:30:10"}
{"current_steps": 541, "total_steps": 980, "loss": 0.0073, "lr": 4.982190555495236e-06, "epoch": 19.321428571428573, "percentage": 55.2, "elapsed_time": "0:37:04", "remaining_time": "0:30:05"}
{"current_steps": 542, "total_steps": 980, "loss": 0.0157, "lr": 4.964381336940542e-06, "epoch": 19.357142857142858, "percentage": 55.31, "elapsed_time": "0:37:07", "remaining_time": "0:30:00"}
{"current_steps": 543, "total_steps": 980, "loss": 0.0098, "lr": 4.946572570283135e-06, "epoch": 19.392857142857142, "percentage": 55.41, "elapsed_time": "0:37:11", "remaining_time": "0:29:55"}
{"current_steps": 544, "total_steps": 980, "loss": 0.0138, "lr": 4.928764481464485e-06, "epoch": 19.428571428571427, "percentage": 55.51, "elapsed_time": "0:37:15", "remaining_time": "0:29:51"}
{"current_steps": 545, "total_steps": 980, "loss": 0.0131, "lr": 4.910957296417467e-06, "epoch": 19.464285714285715, "percentage": 55.61, "elapsed_time": "0:37:18", "remaining_time": "0:29:47"}
{"current_steps": 546, "total_steps": 980, "loss": 0.0133, "lr": 4.893151241063493e-06, "epoch": 19.5, "percentage": 55.71, "elapsed_time": "0:37:22", "remaining_time": "0:29:42"}
{"current_steps": 547, "total_steps": 980, "loss": 0.0139, "lr": 4.875346541309637e-06, "epoch": 19.535714285714285, "percentage": 55.82, "elapsed_time": "0:37:25", "remaining_time": "0:29:37"}
{"current_steps": 548, "total_steps": 980, "loss": 0.0105, "lr": 4.857543423045775e-06, "epoch": 19.571428571428573, "percentage": 55.92, "elapsed_time": "0:37:29", "remaining_time": "0:29:33"}
{"current_steps": 549, "total_steps": 980, "loss": 0.0104, "lr": 4.839742112141725e-06, "epoch": 19.607142857142858, "percentage": 56.02, "elapsed_time": "0:37:33", "remaining_time": "0:29:28"}
{"current_steps": 550, "total_steps": 980, "loss": 0.0127, "lr": 4.821942834444367e-06, "epoch": 19.642857142857142, "percentage": 56.12, "elapsed_time": "0:37:37", "remaining_time": "0:29:24"}
{"current_steps": 551, "total_steps": 980, "loss": 0.0106, "lr": 4.804145815774787e-06, "epoch": 19.678571428571427, "percentage": 56.22, "elapsed_time": "0:37:40", "remaining_time": "0:29:20"}
{"current_steps": 552, "total_steps": 980, "loss": 0.0114, "lr": 4.786351281925417e-06, "epoch": 19.714285714285715, "percentage": 56.33, "elapsed_time": "0:37:43", "remaining_time": "0:29:15"}
{"current_steps": 553, "total_steps": 980, "loss": 0.0127, "lr": 4.768559458657156e-06, "epoch": 19.75, "percentage": 56.43, "elapsed_time": "0:37:47", "remaining_time": "0:29:11"}
{"current_steps": 554, "total_steps": 980, "loss": 0.0176, "lr": 4.750770571696514e-06, "epoch": 19.785714285714285, "percentage": 56.53, "elapsed_time": "0:37:51", "remaining_time": "0:29:06"}
{"current_steps": 555, "total_steps": 980, "loss": 0.0139, "lr": 4.732984846732755e-06, "epoch": 19.821428571428573, "percentage": 56.63, "elapsed_time": "0:37:55", "remaining_time": "0:29:02"}
{"current_steps": 556, "total_steps": 980, "loss": 0.0098, "lr": 4.7152025094150214e-06, "epoch": 19.857142857142858, "percentage": 56.73, "elapsed_time": "0:37:59", "remaining_time": "0:28:58"}
{"current_steps": 557, "total_steps": 980, "loss": 0.0112, "lr": 4.697423785349475e-06, "epoch": 19.892857142857142, "percentage": 56.84, "elapsed_time": "0:38:03", "remaining_time": "0:28:54"}
{"current_steps": 558, "total_steps": 980, "loss": 0.018, "lr": 4.679648900096436e-06, "epoch": 19.928571428571427, "percentage": 56.94, "elapsed_time": "0:38:06", "remaining_time": "0:28:49"}
{"current_steps": 559, "total_steps": 980, "loss": 0.0134, "lr": 4.661878079167527e-06, "epoch": 19.964285714285715, "percentage": 57.04, "elapsed_time": "0:38:10", "remaining_time": "0:28:44"}
{"current_steps": 560, "total_steps": 980, "loss": 0.0077, "lr": 4.644111548022798e-06, "epoch": 20.0, "percentage": 57.14, "elapsed_time": "0:38:14", "remaining_time": "0:28:40"}
{"current_steps": 561, "total_steps": 980, "loss": 0.0101, "lr": 4.626349532067879e-06, "epoch": 20.035714285714285, "percentage": 57.24, "elapsed_time": "0:38:18", "remaining_time": "0:28:36"}
{"current_steps": 562, "total_steps": 980, "loss": 0.0083, "lr": 4.608592256651117e-06, "epoch": 20.071428571428573, "percentage": 57.35, "elapsed_time": "0:38:21", "remaining_time": "0:28:32"}
{"current_steps": 563, "total_steps": 980, "loss": 0.0109, "lr": 4.5908399470607106e-06, "epoch": 20.107142857142858, "percentage": 57.45, "elapsed_time": "0:38:25", "remaining_time": "0:28:27"}
{"current_steps": 564, "total_steps": 980, "loss": 0.0101, "lr": 4.573092828521857e-06, "epoch": 20.142857142857142, "percentage": 57.55, "elapsed_time": "0:38:29", "remaining_time": "0:28:23"}
{"current_steps": 565, "total_steps": 980, "loss": 0.0097, "lr": 4.555351126193901e-06, "epoch": 20.178571428571427, "percentage": 57.65, "elapsed_time": "0:38:32", "remaining_time": "0:28:18"}
{"current_steps": 566, "total_steps": 980, "loss": 0.011, "lr": 4.537615065167461e-06, "epoch": 20.214285714285715, "percentage": 57.76, "elapsed_time": "0:38:35", "remaining_time": "0:28:13"}
{"current_steps": 567, "total_steps": 980, "loss": 0.012, "lr": 4.5198848704615915e-06, "epoch": 20.25, "percentage": 57.86, "elapsed_time": "0:38:39", "remaining_time": "0:28:09"}
{"current_steps": 568, "total_steps": 980, "loss": 0.0086, "lr": 4.502160767020918e-06, "epoch": 20.285714285714285, "percentage": 57.96, "elapsed_time": "0:38:42", "remaining_time": "0:28:04"}
{"current_steps": 569, "total_steps": 980, "loss": 0.0114, "lr": 4.484442979712783e-06, "epoch": 20.321428571428573, "percentage": 58.06, "elapsed_time": "0:38:46", "remaining_time": "0:28:00"}
{"current_steps": 570, "total_steps": 980, "loss": 0.0084, "lr": 4.466731733324399e-06, "epoch": 20.357142857142858, "percentage": 58.16, "elapsed_time": "0:38:50", "remaining_time": "0:27:56"}
{"current_steps": 571, "total_steps": 980, "loss": 0.0095, "lr": 4.449027252559994e-06, "epoch": 20.392857142857142, "percentage": 58.27, "elapsed_time": "0:38:53", "remaining_time": "0:27:51"}
{"current_steps": 572, "total_steps": 980, "loss": 0.009, "lr": 4.431329762037958e-06, "epoch": 20.428571428571427, "percentage": 58.37, "elapsed_time": "0:38:58", "remaining_time": "0:27:47"}
{"current_steps": 573, "total_steps": 980, "loss": 0.0147, "lr": 4.413639486287992e-06, "epoch": 20.464285714285715, "percentage": 58.47, "elapsed_time": "0:39:02", "remaining_time": "0:27:43"}
{"current_steps": 574, "total_steps": 980, "loss": 0.0144, "lr": 4.395956649748269e-06, "epoch": 20.5, "percentage": 58.57, "elapsed_time": "0:39:05", "remaining_time": "0:27:39"}
{"current_steps": 575, "total_steps": 980, "loss": 0.0097, "lr": 4.3782814767625755e-06, "epoch": 20.535714285714285, "percentage": 58.67, "elapsed_time": "0:39:09", "remaining_time": "0:27:35"}
{"current_steps": 576, "total_steps": 980, "loss": 0.0107, "lr": 4.3606141915774695e-06, "epoch": 20.571428571428573, "percentage": 58.78, "elapsed_time": "0:39:13", "remaining_time": "0:27:30"}
{"current_steps": 577, "total_steps": 980, "loss": 0.0125, "lr": 4.342955018339442e-06, "epoch": 20.607142857142858, "percentage": 58.88, "elapsed_time": "0:39:17", "remaining_time": "0:27:26"}
{"current_steps": 578, "total_steps": 980, "loss": 0.0097, "lr": 4.3253041810920595e-06, "epoch": 20.642857142857142, "percentage": 58.98, "elapsed_time": "0:39:20", "remaining_time": "0:27:21"}
{"current_steps": 579, "total_steps": 980, "loss": 0.0104, "lr": 4.307661903773129e-06, "epoch": 20.678571428571427, "percentage": 59.08, "elapsed_time": "0:39:23", "remaining_time": "0:27:17"}
{"current_steps": 580, "total_steps": 980, "loss": 0.0094, "lr": 4.290028410211866e-06, "epoch": 20.714285714285715, "percentage": 59.18, "elapsed_time": "0:39:27", "remaining_time": "0:27:12"}
{"current_steps": 581, "total_steps": 980, "loss": 0.0108, "lr": 4.272403924126035e-06, "epoch": 20.75, "percentage": 59.29, "elapsed_time": "0:39:31", "remaining_time": "0:27:08"}
{"current_steps": 582, "total_steps": 980, "loss": 0.0138, "lr": 4.254788669119127e-06, "epoch": 20.785714285714285, "percentage": 59.39, "elapsed_time": "0:39:35", "remaining_time": "0:27:04"}
{"current_steps": 583, "total_steps": 980, "loss": 0.0121, "lr": 4.237182868677519e-06, "epoch": 20.821428571428573, "percentage": 59.49, "elapsed_time": "0:39:39", "remaining_time": "0:27:00"}
{"current_steps": 584, "total_steps": 980, "loss": 0.0122, "lr": 4.219586746167632e-06, "epoch": 20.857142857142858, "percentage": 59.59, "elapsed_time": "0:39:43", "remaining_time": "0:26:56"}
{"current_steps": 585, "total_steps": 980, "loss": 0.0115, "lr": 4.2020005248331056e-06, "epoch": 20.892857142857142, "percentage": 59.69, "elapsed_time": "0:39:46", "remaining_time": "0:26:51"}
{"current_steps": 586, "total_steps": 980, "loss": 0.0163, "lr": 4.18442442779196e-06, "epoch": 20.928571428571427, "percentage": 59.8, "elapsed_time": "0:39:50", "remaining_time": "0:26:47"}
{"current_steps": 587, "total_steps": 980, "loss": 0.0113, "lr": 4.166858678033771e-06, "epoch": 20.964285714285715, "percentage": 59.9, "elapsed_time": "0:39:53", "remaining_time": "0:26:42"}
{"current_steps": 588, "total_steps": 980, "loss": 0.0107, "lr": 4.149303498416838e-06, "epoch": 21.0, "percentage": 60.0, "elapsed_time": "0:39:58", "remaining_time": "0:26:38"}
{"current_steps": 589, "total_steps": 980, "loss": 0.0105, "lr": 4.131759111665349e-06, "epoch": 21.035714285714285, "percentage": 60.1, "elapsed_time": "0:40:01", "remaining_time": "0:26:34"}
{"current_steps": 590, "total_steps": 980, "loss": 0.0073, "lr": 4.114225740366569e-06, "epoch": 21.071428571428573, "percentage": 60.2, "elapsed_time": "0:40:04", "remaining_time": "0:26:29"}
{"current_steps": 591, "total_steps": 980, "loss": 0.0095, "lr": 4.096703606968007e-06, "epoch": 21.107142857142858, "percentage": 60.31, "elapsed_time": "0:40:09", "remaining_time": "0:26:25"}
{"current_steps": 592, "total_steps": 980, "loss": 0.0096, "lr": 4.079192933774592e-06, "epoch": 21.142857142857142, "percentage": 60.41, "elapsed_time": "0:40:12", "remaining_time": "0:26:21"}
{"current_steps": 593, "total_steps": 980, "loss": 0.0088, "lr": 4.061693942945863e-06, "epoch": 21.178571428571427, "percentage": 60.51, "elapsed_time": "0:40:16", "remaining_time": "0:26:17"}
{"current_steps": 594, "total_steps": 980, "loss": 0.0092, "lr": 4.04420685649314e-06, "epoch": 21.214285714285715, "percentage": 60.61, "elapsed_time": "0:40:20", "remaining_time": "0:26:12"}
{"current_steps": 595, "total_steps": 980, "loss": 0.0088, "lr": 4.026731896276708e-06, "epoch": 21.25, "percentage": 60.71, "elapsed_time": "0:40:23", "remaining_time": "0:26:08"}
{"current_steps": 596, "total_steps": 980, "loss": 0.0105, "lr": 4.009269284003014e-06, "epoch": 21.285714285714285, "percentage": 60.82, "elapsed_time": "0:40:27", "remaining_time": "0:26:04"}
{"current_steps": 597, "total_steps": 980, "loss": 0.0096, "lr": 3.991819241221836e-06, "epoch": 21.321428571428573, "percentage": 60.92, "elapsed_time": "0:40:31", "remaining_time": "0:25:59"}
{"current_steps": 598, "total_steps": 980, "loss": 0.0087, "lr": 3.974381989323484e-06, "epoch": 21.357142857142858, "percentage": 61.02, "elapsed_time": "0:40:34", "remaining_time": "0:25:55"}
{"current_steps": 599, "total_steps": 980, "loss": 0.0111, "lr": 3.956957749535997e-06, "epoch": 21.392857142857142, "percentage": 61.12, "elapsed_time": "0:40:37", "remaining_time": "0:25:50"}
{"current_steps": 600, "total_steps": 980, "loss": 0.0108, "lr": 3.939546742922318e-06, "epoch": 21.428571428571427, "percentage": 61.22, "elapsed_time": "0:40:42", "remaining_time": "0:25:46"}
{"current_steps": 600, "total_steps": 980, "eval_loss": 2.483830213546753, "epoch": 21.428571428571427, "percentage": 61.22, "elapsed_time": "0:40:42", "remaining_time": "0:25:46"}
{"current_steps": 601, "total_steps": 980, "loss": 0.0088, "lr": 3.9221491903775014e-06, "epoch": 21.464285714285715, "percentage": 61.33, "elapsed_time": "0:41:30", "remaining_time": "0:26:10"}
{"current_steps": 602, "total_steps": 980, "loss": 0.0093, "lr": 3.904765312625916e-06, "epoch": 21.5, "percentage": 61.43, "elapsed_time": "0:41:35", "remaining_time": "0:26:06"}
{"current_steps": 603, "total_steps": 980, "loss": 0.0122, "lr": 3.887395330218429e-06, "epoch": 21.535714285714285, "percentage": 61.53, "elapsed_time": "0:41:38", "remaining_time": "0:26:02"}
{"current_steps": 604, "total_steps": 980, "loss": 0.0101, "lr": 3.8700394635296166e-06, "epoch": 21.571428571428573, "percentage": 61.63, "elapsed_time": "0:41:42", "remaining_time": "0:25:57"}
{"current_steps": 605, "total_steps": 980, "loss": 0.0126, "lr": 3.852697932754974e-06, "epoch": 21.607142857142858, "percentage": 61.73, "elapsed_time": "0:41:46", "remaining_time": "0:25:53"}
{"current_steps": 606, "total_steps": 980, "loss": 0.0108, "lr": 3.835370957908108e-06, "epoch": 21.642857142857142, "percentage": 61.84, "elapsed_time": "0:41:50", "remaining_time": "0:25:49"}
{"current_steps": 607, "total_steps": 980, "loss": 0.0091, "lr": 3.818058758817956e-06, "epoch": 21.678571428571427, "percentage": 61.94, "elapsed_time": "0:41:53", "remaining_time": "0:25:44"}
{"current_steps": 608, "total_steps": 980, "loss": 0.0118, "lr": 3.800761555125997e-06, "epoch": 21.714285714285715, "percentage": 62.04, "elapsed_time": "0:41:57", "remaining_time": "0:25:40"}
{"current_steps": 609, "total_steps": 980, "loss": 0.0107, "lr": 3.783479566283457e-06, "epoch": 21.75, "percentage": 62.14, "elapsed_time": "0:42:00", "remaining_time": "0:25:35"}
{"current_steps": 610, "total_steps": 980, "loss": 0.0147, "lr": 3.7662130115485317e-06, "epoch": 21.785714285714285, "percentage": 62.24, "elapsed_time": "0:42:04", "remaining_time": "0:25:31"}
{"current_steps": 611, "total_steps": 980, "loss": 0.0125, "lr": 3.748962109983605e-06, "epoch": 21.821428571428573, "percentage": 62.35, "elapsed_time": "0:42:08", "remaining_time": "0:25:26"}
{"current_steps": 612, "total_steps": 980, "loss": 0.011, "lr": 3.731727080452464e-06, "epoch": 21.857142857142858, "percentage": 62.45, "elapsed_time": "0:42:12", "remaining_time": "0:25:22"}
{"current_steps": 613, "total_steps": 980, "loss": 0.0121, "lr": 3.714508141617527e-06, "epoch": 21.892857142857142, "percentage": 62.55, "elapsed_time": "0:42:15", "remaining_time": "0:25:18"}
{"current_steps": 614, "total_steps": 980, "loss": 0.0128, "lr": 3.69730551193707e-06, "epoch": 21.928571428571427, "percentage": 62.65, "elapsed_time": "0:42:18", "remaining_time": "0:25:13"}
{"current_steps": 615, "total_steps": 980, "loss": 0.0121, "lr": 3.6801194096624515e-06, "epoch": 21.964285714285715, "percentage": 62.76, "elapsed_time": "0:42:22", "remaining_time": "0:25:09"}
{"current_steps": 616, "total_steps": 980, "loss": 0.0098, "lr": 3.6629500528353464e-06, "epoch": 22.0, "percentage": 62.86, "elapsed_time": "0:42:26", "remaining_time": "0:25:04"}
{"current_steps": 617, "total_steps": 980, "loss": 0.0082, "lr": 3.6457976592849753e-06, "epoch": 22.035714285714285, "percentage": 62.96, "elapsed_time": "0:42:30", "remaining_time": "0:25:00"}
{"current_steps": 618, "total_steps": 980, "loss": 0.0079, "lr": 3.6286624466253496e-06, "epoch": 22.071428571428573, "percentage": 63.06, "elapsed_time": "0:42:33", "remaining_time": "0:24:55"}
{"current_steps": 619, "total_steps": 980, "loss": 0.0074, "lr": 3.6115446322525007e-06, "epoch": 22.107142857142858, "percentage": 63.16, "elapsed_time": "0:42:37", "remaining_time": "0:24:51"}
{"current_steps": 620, "total_steps": 980, "loss": 0.0113, "lr": 3.594444433341725e-06, "epoch": 22.142857142857142, "percentage": 63.27, "elapsed_time": "0:42:40", "remaining_time": "0:24:46"}
{"current_steps": 621, "total_steps": 980, "loss": 0.0079, "lr": 3.5773620668448384e-06, "epoch": 22.178571428571427, "percentage": 63.37, "elapsed_time": "0:42:44", "remaining_time": "0:24:42"}
{"current_steps": 622, "total_steps": 980, "loss": 0.0077, "lr": 3.560297749487407e-06, "epoch": 22.214285714285715, "percentage": 63.47, "elapsed_time": "0:42:48", "remaining_time": "0:24:38"}
{"current_steps": 623, "total_steps": 980, "loss": 0.0097, "lr": 3.543251697766006e-06, "epoch": 22.25, "percentage": 63.57, "elapsed_time": "0:42:51", "remaining_time": "0:24:33"}
{"current_steps": 624, "total_steps": 980, "loss": 0.0074, "lr": 3.526224127945479e-06, "epoch": 22.285714285714285, "percentage": 63.67, "elapsed_time": "0:42:55", "remaining_time": "0:24:29"}
{"current_steps": 625, "total_steps": 980, "loss": 0.0087, "lr": 3.5092152560561833e-06, "epoch": 22.321428571428573, "percentage": 63.78, "elapsed_time": "0:42:59", "remaining_time": "0:24:25"}
{"current_steps": 626, "total_steps": 980, "loss": 0.0069, "lr": 3.4922252978912523e-06, "epoch": 22.357142857142858, "percentage": 63.88, "elapsed_time": "0:43:03", "remaining_time": "0:24:20"}
{"current_steps": 627, "total_steps": 980, "loss": 0.0076, "lr": 3.475254469003865e-06, "epoch": 22.392857142857142, "percentage": 63.98, "elapsed_time": "0:43:06", "remaining_time": "0:24:16"}
{"current_steps": 628, "total_steps": 980, "loss": 0.0099, "lr": 3.4583029847044996e-06, "epoch": 22.428571428571427, "percentage": 64.08, "elapsed_time": "0:43:09", "remaining_time": "0:24:11"}
{"current_steps": 629, "total_steps": 980, "loss": 0.0092, "lr": 3.4413710600582096e-06, "epoch": 22.464285714285715, "percentage": 64.18, "elapsed_time": "0:43:13", "remaining_time": "0:24:07"}
{"current_steps": 630, "total_steps": 980, "loss": 0.0113, "lr": 3.424458909881897e-06, "epoch": 22.5, "percentage": 64.29, "elapsed_time": "0:43:17", "remaining_time": "0:24:02"}
{"current_steps": 631, "total_steps": 980, "loss": 0.0102, "lr": 3.4075667487415785e-06, "epoch": 22.535714285714285, "percentage": 64.39, "elapsed_time": "0:43:21", "remaining_time": "0:23:58"}
{"current_steps": 632, "total_steps": 980, "loss": 0.0126, "lr": 3.3906947909496696e-06, "epoch": 22.571428571428573, "percentage": 64.49, "elapsed_time": "0:43:24", "remaining_time": "0:23:54"}
{"current_steps": 633, "total_steps": 980, "loss": 0.0099, "lr": 3.3738432505622653e-06, "epoch": 22.607142857142858, "percentage": 64.59, "elapsed_time": "0:43:28", "remaining_time": "0:23:50"}
{"current_steps": 634, "total_steps": 980, "loss": 0.0105, "lr": 3.357012341376421e-06, "epoch": 22.642857142857142, "percentage": 64.69, "elapsed_time": "0:43:32", "remaining_time": "0:23:45"}
{"current_steps": 635, "total_steps": 980, "loss": 0.014, "lr": 3.3402022769274422e-06, "epoch": 22.678571428571427, "percentage": 64.8, "elapsed_time": "0:43:35", "remaining_time": "0:23:41"}
{"current_steps": 636, "total_steps": 980, "loss": 0.0094, "lr": 3.3234132704861786e-06, "epoch": 22.714285714285715, "percentage": 64.9, "elapsed_time": "0:43:38", "remaining_time": "0:23:36"}
{"current_steps": 637, "total_steps": 980, "loss": 0.0127, "lr": 3.306645535056312e-06, "epoch": 22.75, "percentage": 65.0, "elapsed_time": "0:43:43", "remaining_time": "0:23:32"}
{"current_steps": 638, "total_steps": 980, "loss": 0.0125, "lr": 3.289899283371657e-06, "epoch": 22.785714285714285, "percentage": 65.1, "elapsed_time": "0:43:46", "remaining_time": "0:23:27"}
{"current_steps": 639, "total_steps": 980, "loss": 0.0098, "lr": 3.273174727893463e-06, "epoch": 22.821428571428573, "percentage": 65.2, "elapsed_time": "0:43:50", "remaining_time": "0:23:23"}
{"current_steps": 640, "total_steps": 980, "loss": 0.0149, "lr": 3.2564720808077167e-06, "epoch": 22.857142857142858, "percentage": 65.31, "elapsed_time": "0:43:54", "remaining_time": "0:23:19"}
{"current_steps": 641, "total_steps": 980, "loss": 0.0115, "lr": 3.2397915540224493e-06, "epoch": 22.892857142857142, "percentage": 65.41, "elapsed_time": "0:43:58", "remaining_time": "0:23:15"}
{"current_steps": 642, "total_steps": 980, "loss": 0.0111, "lr": 3.2231333591650567e-06, "epoch": 22.928571428571427, "percentage": 65.51, "elapsed_time": "0:44:01", "remaining_time": "0:23:10"}
{"current_steps": 643, "total_steps": 980, "loss": 0.0117, "lr": 3.2064977075795988e-06, "epoch": 22.964285714285715, "percentage": 65.61, "elapsed_time": "0:44:04", "remaining_time": "0:23:06"}
{"current_steps": 644, "total_steps": 980, "loss": 0.0086, "lr": 3.189884810324133e-06, "epoch": 23.0, "percentage": 65.71, "elapsed_time": "0:44:08", "remaining_time": "0:23:02"}
{"current_steps": 645, "total_steps": 980, "loss": 0.0107, "lr": 3.173294878168025e-06, "epoch": 23.035714285714285, "percentage": 65.82, "elapsed_time": "0:44:12", "remaining_time": "0:22:57"}
{"current_steps": 646, "total_steps": 980, "loss": 0.0047, "lr": 3.1567281215892868e-06, "epoch": 23.071428571428573, "percentage": 65.92, "elapsed_time": "0:44:15", "remaining_time": "0:22:53"}
{"current_steps": 647, "total_steps": 980, "loss": 0.009, "lr": 3.140184750771895e-06, "epoch": 23.107142857142858, "percentage": 66.02, "elapsed_time": "0:44:19", "remaining_time": "0:22:48"}
{"current_steps": 648, "total_steps": 980, "loss": 0.0091, "lr": 3.12366497560313e-06, "epoch": 23.142857142857142, "percentage": 66.12, "elapsed_time": "0:44:22", "remaining_time": "0:22:44"}
{"current_steps": 649, "total_steps": 980, "loss": 0.0079, "lr": 3.1071690056709125e-06, "epoch": 23.178571428571427, "percentage": 66.22, "elapsed_time": "0:44:26", "remaining_time": "0:22:40"}
{"current_steps": 650, "total_steps": 980, "loss": 0.0082, "lr": 3.090697050261143e-06, "epoch": 23.214285714285715, "percentage": 66.33, "elapsed_time": "0:44:30", "remaining_time": "0:22:35"}
{"current_steps": 651, "total_steps": 980, "loss": 0.0078, "lr": 3.074249318355046e-06, "epoch": 23.25, "percentage": 66.43, "elapsed_time": "0:44:35", "remaining_time": "0:22:31"}
{"current_steps": 652, "total_steps": 980, "loss": 0.0077, "lr": 3.057826018626527e-06, "epoch": 23.285714285714285, "percentage": 66.53, "elapsed_time": "0:44:39", "remaining_time": "0:22:27"}
{"current_steps": 653, "total_steps": 980, "loss": 0.0073, "lr": 3.0414273594395106e-06, "epoch": 23.321428571428573, "percentage": 66.63, "elapsed_time": "0:44:43", "remaining_time": "0:22:23"}
{"current_steps": 654, "total_steps": 980, "loss": 0.0113, "lr": 3.0250535488453077e-06, "epoch": 23.357142857142858, "percentage": 66.73, "elapsed_time": "0:44:47", "remaining_time": "0:22:19"}
{"current_steps": 655, "total_steps": 980, "loss": 0.0079, "lr": 3.008704794579973e-06, "epoch": 23.392857142857142, "percentage": 66.84, "elapsed_time": "0:44:51", "remaining_time": "0:22:15"}
{"current_steps": 656, "total_steps": 980, "loss": 0.0088, "lr": 2.9923813040616685e-06, "epoch": 23.428571428571427, "percentage": 66.94, "elapsed_time": "0:44:55", "remaining_time": "0:22:11"}
{"current_steps": 657, "total_steps": 980, "loss": 0.0111, "lr": 2.976083284388031e-06, "epoch": 23.464285714285715, "percentage": 67.04, "elapsed_time": "0:44:59", "remaining_time": "0:22:07"}
{"current_steps": 658, "total_steps": 980, "loss": 0.0117, "lr": 2.959810942333552e-06, "epoch": 23.5, "percentage": 67.14, "elapsed_time": "0:45:02", "remaining_time": "0:22:02"}
{"current_steps": 659, "total_steps": 980, "loss": 0.008, "lr": 2.9435644843469434e-06, "epoch": 23.535714285714285, "percentage": 67.24, "elapsed_time": "0:45:06", "remaining_time": "0:21:58"}
{"current_steps": 660, "total_steps": 980, "loss": 0.0078, "lr": 2.9273441165485227e-06, "epoch": 23.571428571428573, "percentage": 67.35, "elapsed_time": "0:45:10", "remaining_time": "0:21:54"}
{"current_steps": 661, "total_steps": 980, "loss": 0.0141, "lr": 2.9111500447276053e-06, "epoch": 23.607142857142858, "percentage": 67.45, "elapsed_time": "0:45:14", "remaining_time": "0:21:49"}
{"current_steps": 662, "total_steps": 980, "loss": 0.0095, "lr": 2.8949824743398804e-06, "epoch": 23.642857142857142, "percentage": 67.55, "elapsed_time": "0:45:17", "remaining_time": "0:21:45"}
{"current_steps": 663, "total_steps": 980, "loss": 0.0104, "lr": 2.8788416105048124e-06, "epoch": 23.678571428571427, "percentage": 67.65, "elapsed_time": "0:45:21", "remaining_time": "0:21:41"}
{"current_steps": 664, "total_steps": 980, "loss": 0.0122, "lr": 2.862727658003042e-06, "epoch": 23.714285714285715, "percentage": 67.76, "elapsed_time": "0:45:24", "remaining_time": "0:21:36"}
{"current_steps": 665, "total_steps": 980, "loss": 0.0091, "lr": 2.8466408212737777e-06, "epoch": 23.75, "percentage": 67.86, "elapsed_time": "0:45:28", "remaining_time": "0:21:32"}
{"current_steps": 666, "total_steps": 980, "loss": 0.0115, "lr": 2.83058130441221e-06, "epoch": 23.785714285714285, "percentage": 67.96, "elapsed_time": "0:45:31", "remaining_time": "0:21:27"}
{"current_steps": 667, "total_steps": 980, "loss": 0.01, "lr": 2.8145493111669186e-06, "epoch": 23.821428571428573, "percentage": 68.06, "elapsed_time": "0:45:34", "remaining_time": "0:21:23"}
{"current_steps": 668, "total_steps": 980, "loss": 0.0133, "lr": 2.79854504493729e-06, "epoch": 23.857142857142858, "percentage": 68.16, "elapsed_time": "0:45:37", "remaining_time": "0:21:18"}
{"current_steps": 669, "total_steps": 980, "loss": 0.0094, "lr": 2.782568708770933e-06, "epoch": 23.892857142857142, "percentage": 68.27, "elapsed_time": "0:45:41", "remaining_time": "0:21:14"}
{"current_steps": 670, "total_steps": 980, "loss": 0.0126, "lr": 2.7666205053611097e-06, "epoch": 23.928571428571427, "percentage": 68.37, "elapsed_time": "0:45:45", "remaining_time": "0:21:10"}
{"current_steps": 671, "total_steps": 980, "loss": 0.012, "lr": 2.7507006370441557e-06, "epoch": 23.964285714285715, "percentage": 68.47, "elapsed_time": "0:45:48", "remaining_time": "0:21:05"}
{"current_steps": 672, "total_steps": 980, "loss": 0.0101, "lr": 2.734809305796915e-06, "epoch": 24.0, "percentage": 68.57, "elapsed_time": "0:45:52", "remaining_time": "0:21:01"}
{"current_steps": 673, "total_steps": 980, "loss": 0.0113, "lr": 2.718946713234185e-06, "epoch": 24.035714285714285, "percentage": 68.67, "elapsed_time": "0:45:56", "remaining_time": "0:20:57"}
{"current_steps": 674, "total_steps": 980, "loss": 0.0094, "lr": 2.7031130606061486e-06, "epoch": 24.071428571428573, "percentage": 68.78, "elapsed_time": "0:45:59", "remaining_time": "0:20:52"}
{"current_steps": 675, "total_steps": 980, "loss": 0.0078, "lr": 2.687308548795825e-06, "epoch": 24.107142857142858, "percentage": 68.88, "elapsed_time": "0:46:03", "remaining_time": "0:20:48"}
{"current_steps": 676, "total_steps": 980, "loss": 0.0085, "lr": 2.67153337831652e-06, "epoch": 24.142857142857142, "percentage": 68.98, "elapsed_time": "0:46:06", "remaining_time": "0:20:44"}
{"current_steps": 677, "total_steps": 980, "loss": 0.0098, "lr": 2.6557877493092885e-06, "epoch": 24.178571428571427, "percentage": 69.08, "elapsed_time": "0:46:09", "remaining_time": "0:20:39"}
{"current_steps": 678, "total_steps": 980, "loss": 0.0075, "lr": 2.6400718615403852e-06, "epoch": 24.214285714285715, "percentage": 69.18, "elapsed_time": "0:46:12", "remaining_time": "0:20:35"}
{"current_steps": 679, "total_steps": 980, "loss": 0.0122, "lr": 2.624385914398737e-06, "epoch": 24.25, "percentage": 69.29, "elapsed_time": "0:46:17", "remaining_time": "0:20:31"}
{"current_steps": 680, "total_steps": 980, "loss": 0.0067, "lr": 2.608730106893411e-06, "epoch": 24.285714285714285, "percentage": 69.39, "elapsed_time": "0:46:21", "remaining_time": "0:20:27"}
{"current_steps": 681, "total_steps": 980, "loss": 0.0077, "lr": 2.5931046376510875e-06, "epoch": 24.321428571428573, "percentage": 69.49, "elapsed_time": "0:46:24", "remaining_time": "0:20:22"}
{"current_steps": 682, "total_steps": 980, "loss": 0.0075, "lr": 2.5775097049135445e-06, "epoch": 24.357142857142858, "percentage": 69.59, "elapsed_time": "0:46:27", "remaining_time": "0:20:18"}
{"current_steps": 683, "total_steps": 980, "loss": 0.0102, "lr": 2.561945506535144e-06, "epoch": 24.392857142857142, "percentage": 69.69, "elapsed_time": "0:46:31", "remaining_time": "0:20:13"}
{"current_steps": 684, "total_steps": 980, "loss": 0.0099, "lr": 2.5464122399803126e-06, "epoch": 24.428571428571427, "percentage": 69.8, "elapsed_time": "0:46:34", "remaining_time": "0:20:09"}
{"current_steps": 685, "total_steps": 980, "loss": 0.0125, "lr": 2.5309101023210426e-06, "epoch": 24.464285714285715, "percentage": 69.9, "elapsed_time": "0:46:37", "remaining_time": "0:20:04"}
{"current_steps": 686, "total_steps": 980, "loss": 0.0061, "lr": 2.5154392902343966e-06, "epoch": 24.5, "percentage": 70.0, "elapsed_time": "0:46:40", "remaining_time": "0:20:00"}
{"current_steps": 687, "total_steps": 980, "loss": 0.0104, "lr": 2.5000000000000015e-06, "epoch": 24.535714285714285, "percentage": 70.1, "elapsed_time": "0:46:45", "remaining_time": "0:19:56"}
{"current_steps": 688, "total_steps": 980, "loss": 0.008, "lr": 2.4845924274975625e-06, "epoch": 24.571428571428573, "percentage": 70.2, "elapsed_time": "0:46:49", "remaining_time": "0:19:52"}
{"current_steps": 689, "total_steps": 980, "loss": 0.0072, "lr": 2.4692167682043855e-06, "epoch": 24.607142857142858, "percentage": 70.31, "elapsed_time": "0:46:53", "remaining_time": "0:19:48"}
{"current_steps": 690, "total_steps": 980, "loss": 0.0129, "lr": 2.4538732171928847e-06, "epoch": 24.642857142857142, "percentage": 70.41, "elapsed_time": "0:46:56", "remaining_time": "0:19:43"}
{"current_steps": 691, "total_steps": 980, "loss": 0.0093, "lr": 2.4385619691281144e-06, "epoch": 24.678571428571427, "percentage": 70.51, "elapsed_time": "0:46:59", "remaining_time": "0:19:39"}
{"current_steps": 692, "total_steps": 980, "loss": 0.01, "lr": 2.4232832182653014e-06, "epoch": 24.714285714285715, "percentage": 70.61, "elapsed_time": "0:47:04", "remaining_time": "0:19:35"}
{"current_steps": 693, "total_steps": 980, "loss": 0.0092, "lr": 2.408037158447375e-06, "epoch": 24.75, "percentage": 70.71, "elapsed_time": "0:47:07", "remaining_time": "0:19:31"}
{"current_steps": 694, "total_steps": 980, "loss": 0.0099, "lr": 2.39282398310251e-06, "epoch": 24.785714285714285, "percentage": 70.82, "elapsed_time": "0:47:11", "remaining_time": "0:19:26"}
{"current_steps": 695, "total_steps": 980, "loss": 0.009, "lr": 2.3776438852416743e-06, "epoch": 24.821428571428573, "percentage": 70.92, "elapsed_time": "0:47:15", "remaining_time": "0:19:22"}
{"current_steps": 696, "total_steps": 980, "loss": 0.0098, "lr": 2.3624970574561773e-06, "epoch": 24.857142857142858, "percentage": 71.02, "elapsed_time": "0:47:19", "remaining_time": "0:19:18"}
{"current_steps": 697, "total_steps": 980, "loss": 0.013, "lr": 2.3473836919152267e-06, "epoch": 24.892857142857142, "percentage": 71.12, "elapsed_time": "0:47:22", "remaining_time": "0:19:14"}
{"current_steps": 698, "total_steps": 980, "loss": 0.0098, "lr": 2.332303980363497e-06, "epoch": 24.928571428571427, "percentage": 71.22, "elapsed_time": "0:47:26", "remaining_time": "0:19:10"}
{"current_steps": 699, "total_steps": 980, "loss": 0.0109, "lr": 2.317258114118686e-06, "epoch": 24.964285714285715, "percentage": 71.33, "elapsed_time": "0:47:30", "remaining_time": "0:19:05"}
{"current_steps": 700, "total_steps": 980, "loss": 0.0119, "lr": 2.3022462840690933e-06, "epoch": 25.0, "percentage": 71.43, "elapsed_time": "0:47:34", "remaining_time": "0:19:01"}
{"current_steps": 700, "total_steps": 980, "eval_loss": 2.5329432487487793, "epoch": 25.0, "percentage": 71.43, "elapsed_time": "0:47:34", "remaining_time": "0:19:01"}
{"current_steps": 701, "total_steps": 980, "loss": 0.0101, "lr": 2.2872686806712037e-06, "epoch": 25.035714285714285, "percentage": 71.53, "elapsed_time": "0:48:23", "remaining_time": "0:19:15"}
{"current_steps": 702, "total_steps": 980, "loss": 0.0078, "lr": 2.272325493947257e-06, "epoch": 25.071428571428573, "percentage": 71.63, "elapsed_time": "0:48:26", "remaining_time": "0:19:11"}
{"current_steps": 703, "total_steps": 980, "loss": 0.0084, "lr": 2.257416913482853e-06, "epoch": 25.107142857142858, "percentage": 71.73, "elapsed_time": "0:48:30", "remaining_time": "0:19:06"}
{"current_steps": 704, "total_steps": 980, "loss": 0.0071, "lr": 2.2425431284245302e-06, "epoch": 25.142857142857142, "percentage": 71.84, "elapsed_time": "0:48:33", "remaining_time": "0:19:02"}
{"current_steps": 705, "total_steps": 980, "loss": 0.0085, "lr": 2.2277043274773856e-06, "epoch": 25.178571428571427, "percentage": 71.94, "elapsed_time": "0:48:36", "remaining_time": "0:18:57"}
{"current_steps": 706, "total_steps": 980, "loss": 0.0079, "lr": 2.2129006989026612e-06, "epoch": 25.214285714285715, "percentage": 72.04, "elapsed_time": "0:48:40", "remaining_time": "0:18:53"}
{"current_steps": 707, "total_steps": 980, "loss": 0.0105, "lr": 2.1981324305153644e-06, "epoch": 25.25, "percentage": 72.14, "elapsed_time": "0:48:43", "remaining_time": "0:18:49"}
{"current_steps": 708, "total_steps": 980, "loss": 0.0099, "lr": 2.1833997096818897e-06, "epoch": 25.285714285714285, "percentage": 72.24, "elapsed_time": "0:48:47", "remaining_time": "0:18:44"}
{"current_steps": 709, "total_steps": 980, "loss": 0.0067, "lr": 2.168702723317632e-06, "epoch": 25.321428571428573, "percentage": 72.35, "elapsed_time": "0:48:50", "remaining_time": "0:18:40"}
{"current_steps": 710, "total_steps": 980, "loss": 0.0083, "lr": 2.1540416578846207e-06, "epoch": 25.357142857142858, "percentage": 72.45, "elapsed_time": "0:48:54", "remaining_time": "0:18:35"}
{"current_steps": 711, "total_steps": 980, "loss": 0.0091, "lr": 2.139416699389153e-06, "epoch": 25.392857142857142, "percentage": 72.55, "elapsed_time": "0:48:57", "remaining_time": "0:18:31"}
{"current_steps": 712, "total_steps": 980, "loss": 0.0075, "lr": 2.1248280333794347e-06, "epoch": 25.428571428571427, "percentage": 72.65, "elapsed_time": "0:49:01", "remaining_time": "0:18:27"}
{"current_steps": 713, "total_steps": 980, "loss": 0.0075, "lr": 2.1102758449432233e-06, "epoch": 25.464285714285715, "percentage": 72.76, "elapsed_time": "0:49:05", "remaining_time": "0:18:23"}
{"current_steps": 714, "total_steps": 980, "loss": 0.0081, "lr": 2.095760318705487e-06, "epoch": 25.5, "percentage": 72.86, "elapsed_time": "0:49:09", "remaining_time": "0:18:18"}
{"current_steps": 715, "total_steps": 980, "loss": 0.01, "lr": 2.081281638826052e-06, "epoch": 25.535714285714285, "percentage": 72.96, "elapsed_time": "0:49:14", "remaining_time": "0:18:14"}
{"current_steps": 716, "total_steps": 980, "loss": 0.0136, "lr": 2.0668399889972717e-06, "epoch": 25.571428571428573, "percentage": 73.06, "elapsed_time": "0:49:17", "remaining_time": "0:18:10"}
{"current_steps": 717, "total_steps": 980, "loss": 0.009, "lr": 2.0524355524417017e-06, "epoch": 25.607142857142858, "percentage": 73.16, "elapsed_time": "0:49:20", "remaining_time": "0:18:06"}
{"current_steps": 718, "total_steps": 980, "loss": 0.0076, "lr": 2.038068511909762e-06, "epoch": 25.642857142857142, "percentage": 73.27, "elapsed_time": "0:49:24", "remaining_time": "0:18:01"}
{"current_steps": 719, "total_steps": 980, "loss": 0.0108, "lr": 2.0237390496774284e-06, "epoch": 25.678571428571427, "percentage": 73.37, "elapsed_time": "0:49:28", "remaining_time": "0:17:57"}
{"current_steps": 720, "total_steps": 980, "loss": 0.009, "lr": 2.00944734754392e-06, "epoch": 25.714285714285715, "percentage": 73.47, "elapsed_time": "0:49:32", "remaining_time": "0:17:53"}
{"current_steps": 721, "total_steps": 980, "loss": 0.0139, "lr": 1.995193586829387e-06, "epoch": 25.75, "percentage": 73.57, "elapsed_time": "0:49:36", "remaining_time": "0:17:49"}
{"current_steps": 722, "total_steps": 980, "loss": 0.01, "lr": 1.980977948372612e-06, "epoch": 25.785714285714285, "percentage": 73.67, "elapsed_time": "0:49:40", "remaining_time": "0:17:45"}
{"current_steps": 723, "total_steps": 980, "loss": 0.0125, "lr": 1.966800612528723e-06, "epoch": 25.821428571428573, "percentage": 73.78, "elapsed_time": "0:49:44", "remaining_time": "0:17:40"}
{"current_steps": 724, "total_steps": 980, "loss": 0.0115, "lr": 1.952661759166893e-06, "epoch": 25.857142857142858, "percentage": 73.88, "elapsed_time": "0:49:48", "remaining_time": "0:17:36"}
{"current_steps": 725, "total_steps": 980, "loss": 0.0064, "lr": 1.9385615676680663e-06, "epoch": 25.892857142857142, "percentage": 73.98, "elapsed_time": "0:49:51", "remaining_time": "0:17:32"}
{"current_steps": 726, "total_steps": 980, "loss": 0.0117, "lr": 1.9245002169226814e-06, "epoch": 25.928571428571427, "percentage": 74.08, "elapsed_time": "0:49:55", "remaining_time": "0:17:27"}
{"current_steps": 727, "total_steps": 980, "loss": 0.0098, "lr": 1.910477885328399e-06, "epoch": 25.964285714285715, "percentage": 74.18, "elapsed_time": "0:49:58", "remaining_time": "0:17:23"}
{"current_steps": 728, "total_steps": 980, "loss": 0.0086, "lr": 1.8964947507878401e-06, "epoch": 26.0, "percentage": 74.29, "elapsed_time": "0:50:02", "remaining_time": "0:17:19"}
{"current_steps": 729, "total_steps": 980, "loss": 0.0094, "lr": 1.8825509907063328e-06, "epoch": 26.035714285714285, "percentage": 74.39, "elapsed_time": "0:50:06", "remaining_time": "0:17:15"}
{"current_steps": 730, "total_steps": 980, "loss": 0.007, "lr": 1.8686467819896542e-06, "epoch": 26.071428571428573, "percentage": 74.49, "elapsed_time": "0:50:10", "remaining_time": "0:17:10"}
{"current_steps": 731, "total_steps": 980, "loss": 0.0071, "lr": 1.8547823010417876e-06, "epoch": 26.107142857142858, "percentage": 74.59, "elapsed_time": "0:50:13", "remaining_time": "0:17:06"}
{"current_steps": 732, "total_steps": 980, "loss": 0.0092, "lr": 1.8409577237626935e-06, "epoch": 26.142857142857142, "percentage": 74.69, "elapsed_time": "0:50:16", "remaining_time": "0:17:02"}
{"current_steps": 733, "total_steps": 980, "loss": 0.0095, "lr": 1.8271732255460644e-06, "epoch": 26.178571428571427, "percentage": 74.8, "elapsed_time": "0:50:20", "remaining_time": "0:16:57"}
{"current_steps": 734, "total_steps": 980, "loss": 0.0068, "lr": 1.8134289812771077e-06, "epoch": 26.214285714285715, "percentage": 74.9, "elapsed_time": "0:50:24", "remaining_time": "0:16:53"}
{"current_steps": 735, "total_steps": 980, "loss": 0.0058, "lr": 1.7997251653303249e-06, "epoch": 26.25, "percentage": 75.0, "elapsed_time": "0:50:28", "remaining_time": "0:16:49"}
{"current_steps": 736, "total_steps": 980, "loss": 0.0089, "lr": 1.7860619515673034e-06, "epoch": 26.285714285714285, "percentage": 75.1, "elapsed_time": "0:50:31", "remaining_time": "0:16:45"}
{"current_steps": 737, "total_steps": 980, "loss": 0.0078, "lr": 1.7724395133345025e-06, "epoch": 26.321428571428573, "percentage": 75.2, "elapsed_time": "0:50:35", "remaining_time": "0:16:40"}
{"current_steps": 738, "total_steps": 980, "loss": 0.0112, "lr": 1.7588580234610592e-06, "epoch": 26.357142857142858, "percentage": 75.31, "elapsed_time": "0:50:39", "remaining_time": "0:16:36"}
{"current_steps": 739, "total_steps": 980, "loss": 0.0078, "lr": 1.7453176542565958e-06, "epoch": 26.392857142857142, "percentage": 75.41, "elapsed_time": "0:50:42", "remaining_time": "0:16:32"}
{"current_steps": 740, "total_steps": 980, "loss": 0.0084, "lr": 1.7318185775090336e-06, "epoch": 26.428571428571427, "percentage": 75.51, "elapsed_time": "0:50:47", "remaining_time": "0:16:28"}
{"current_steps": 741, "total_steps": 980, "loss": 0.01, "lr": 1.7183609644824096e-06, "epoch": 26.464285714285715, "percentage": 75.61, "elapsed_time": "0:50:51", "remaining_time": "0:16:24"}
{"current_steps": 742, "total_steps": 980, "loss": 0.008, "lr": 1.7049449859147121e-06, "epoch": 26.5, "percentage": 75.71, "elapsed_time": "0:50:55", "remaining_time": "0:16:20"}
{"current_steps": 743, "total_steps": 980, "loss": 0.008, "lr": 1.6915708120157042e-06, "epoch": 26.535714285714285, "percentage": 75.82, "elapsed_time": "0:50:59", "remaining_time": "0:16:15"}
{"current_steps": 744, "total_steps": 980, "loss": 0.0108, "lr": 1.67823861246477e-06, "epoch": 26.571428571428573, "percentage": 75.92, "elapsed_time": "0:51:02", "remaining_time": "0:16:11"}
{"current_steps": 745, "total_steps": 980, "loss": 0.0088, "lr": 1.6649485564087646e-06, "epoch": 26.607142857142858, "percentage": 76.02, "elapsed_time": "0:51:06", "remaining_time": "0:16:07"}
{"current_steps": 746, "total_steps": 980, "loss": 0.0102, "lr": 1.6517008124598622e-06, "epoch": 26.642857142857142, "percentage": 76.12, "elapsed_time": "0:51:10", "remaining_time": "0:16:03"}
{"current_steps": 747, "total_steps": 980, "loss": 0.0123, "lr": 1.6384955486934157e-06, "epoch": 26.678571428571427, "percentage": 76.22, "elapsed_time": "0:51:13", "remaining_time": "0:15:58"}
{"current_steps": 748, "total_steps": 980, "loss": 0.0086, "lr": 1.6253329326458367e-06, "epoch": 26.714285714285715, "percentage": 76.33, "elapsed_time": "0:51:17", "remaining_time": "0:15:54"}
{"current_steps": 749, "total_steps": 980, "loss": 0.0089, "lr": 1.612213131312454e-06, "epoch": 26.75, "percentage": 76.43, "elapsed_time": "0:51:21", "remaining_time": "0:15:50"}
{"current_steps": 750, "total_steps": 980, "loss": 0.009, "lr": 1.5991363111454023e-06, "epoch": 26.785714285714285, "percentage": 76.53, "elapsed_time": "0:51:25", "remaining_time": "0:15:46"}
{"current_steps": 751, "total_steps": 980, "loss": 0.0098, "lr": 1.5861026380515165e-06, "epoch": 26.821428571428573, "percentage": 76.63, "elapsed_time": "0:51:28", "remaining_time": "0:15:41"}
{"current_steps": 752, "total_steps": 980, "loss": 0.0102, "lr": 1.5731122773902147e-06, "epoch": 26.857142857142858, "percentage": 76.73, "elapsed_time": "0:51:32", "remaining_time": "0:15:37"}
{"current_steps": 753, "total_steps": 980, "loss": 0.0098, "lr": 1.5601653939714073e-06, "epoch": 26.892857142857142, "percentage": 76.84, "elapsed_time": "0:51:35", "remaining_time": "0:15:33"}
{"current_steps": 754, "total_steps": 980, "loss": 0.0112, "lr": 1.547262152053406e-06, "epoch": 26.928571428571427, "percentage": 76.94, "elapsed_time": "0:51:39", "remaining_time": "0:15:28"}
{"current_steps": 755, "total_steps": 980, "loss": 0.0097, "lr": 1.5344027153408375e-06, "epoch": 26.964285714285715, "percentage": 77.04, "elapsed_time": "0:51:42", "remaining_time": "0:15:24"}
{"current_steps": 756, "total_steps": 980, "loss": 0.0085, "lr": 1.5215872469825682e-06, "epoch": 27.0, "percentage": 77.14, "elapsed_time": "0:51:46", "remaining_time": "0:15:20"}
{"current_steps": 757, "total_steps": 980, "loss": 0.0086, "lr": 1.5088159095696365e-06, "epoch": 27.035714285714285, "percentage": 77.24, "elapsed_time": "0:51:49", "remaining_time": "0:15:16"}
{"current_steps": 758, "total_steps": 980, "loss": 0.0088, "lr": 1.4960888651331833e-06, "epoch": 27.071428571428573, "percentage": 77.35, "elapsed_time": "0:51:53", "remaining_time": "0:15:12"}
{"current_steps": 759, "total_steps": 980, "loss": 0.008, "lr": 1.4834062751424018e-06, "epoch": 27.107142857142858, "percentage": 77.45, "elapsed_time": "0:51:58", "remaining_time": "0:15:07"}
{"current_steps": 760, "total_steps": 980, "loss": 0.0093, "lr": 1.4707683005024898e-06, "epoch": 27.142857142857142, "percentage": 77.55, "elapsed_time": "0:52:01", "remaining_time": "0:15:03"}
{"current_steps": 761, "total_steps": 980, "loss": 0.007, "lr": 1.4581751015526035e-06, "epoch": 27.178571428571427, "percentage": 77.65, "elapsed_time": "0:52:05", "remaining_time": "0:14:59"}
{"current_steps": 762, "total_steps": 980, "loss": 0.0079, "lr": 1.4456268380638262e-06, "epoch": 27.214285714285715, "percentage": 77.76, "elapsed_time": "0:52:08", "remaining_time": "0:14:55"}
{"current_steps": 763, "total_steps": 980, "loss": 0.0086, "lr": 1.4331236692371386e-06, "epoch": 27.25, "percentage": 77.86, "elapsed_time": "0:52:12", "remaining_time": "0:14:50"}
{"current_steps": 764, "total_steps": 980, "loss": 0.0087, "lr": 1.4206657537014078e-06, "epoch": 27.285714285714285, "percentage": 77.96, "elapsed_time": "0:52:16", "remaining_time": "0:14:46"}
{"current_steps": 765, "total_steps": 980, "loss": 0.0083, "lr": 1.4082532495113627e-06, "epoch": 27.321428571428573, "percentage": 78.06, "elapsed_time": "0:52:19", "remaining_time": "0:14:42"}
{"current_steps": 766, "total_steps": 980, "loss": 0.0068, "lr": 1.3958863141455937e-06, "epoch": 27.357142857142858, "percentage": 78.16, "elapsed_time": "0:52:23", "remaining_time": "0:14:38"}
{"current_steps": 767, "total_steps": 980, "loss": 0.0098, "lr": 1.38356510450456e-06, "epoch": 27.392857142857142, "percentage": 78.27, "elapsed_time": "0:52:27", "remaining_time": "0:14:34"}
{"current_steps": 768, "total_steps": 980, "loss": 0.0126, "lr": 1.3712897769085903e-06, "epoch": 27.428571428571427, "percentage": 78.37, "elapsed_time": "0:52:30", "remaining_time": "0:14:29"}
{"current_steps": 769, "total_steps": 980, "loss": 0.0093, "lr": 1.3590604870959046e-06, "epoch": 27.464285714285715, "percentage": 78.47, "elapsed_time": "0:52:33", "remaining_time": "0:14:25"}
{"current_steps": 770, "total_steps": 980, "loss": 0.011, "lr": 1.3468773902206378e-06, "epoch": 27.5, "percentage": 78.57, "elapsed_time": "0:52:37", "remaining_time": "0:14:21"}
{"current_steps": 771, "total_steps": 980, "loss": 0.0084, "lr": 1.3347406408508695e-06, "epoch": 27.535714285714285, "percentage": 78.67, "elapsed_time": "0:52:40", "remaining_time": "0:14:16"}
{"current_steps": 772, "total_steps": 980, "loss": 0.0082, "lr": 1.322650392966665e-06, "epoch": 27.571428571428573, "percentage": 78.78, "elapsed_time": "0:52:44", "remaining_time": "0:14:12"}
{"current_steps": 773, "total_steps": 980, "loss": 0.0084, "lr": 1.3106067999581224e-06, "epoch": 27.607142857142858, "percentage": 78.88, "elapsed_time": "0:52:48", "remaining_time": "0:14:08"}
{"current_steps": 774, "total_steps": 980, "loss": 0.0076, "lr": 1.298610014623423e-06, "epoch": 27.642857142857142, "percentage": 78.98, "elapsed_time": "0:52:52", "remaining_time": "0:14:04"}
{"current_steps": 775, "total_steps": 980, "loss": 0.0098, "lr": 1.2866601891668945e-06, "epoch": 27.678571428571427, "percentage": 79.08, "elapsed_time": "0:52:56", "remaining_time": "0:14:00"}
{"current_steps": 776, "total_steps": 980, "loss": 0.0077, "lr": 1.2747574751970826e-06, "epoch": 27.714285714285715, "percentage": 79.18, "elapsed_time": "0:53:00", "remaining_time": "0:13:56"}
{"current_steps": 777, "total_steps": 980, "loss": 0.0107, "lr": 1.2629020237248241e-06, "epoch": 27.75, "percentage": 79.29, "elapsed_time": "0:53:04", "remaining_time": "0:13:52"}
{"current_steps": 778, "total_steps": 980, "loss": 0.0096, "lr": 1.2510939851613285e-06, "epoch": 27.785714285714285, "percentage": 79.39, "elapsed_time": "0:53:07", "remaining_time": "0:13:47"}
{"current_steps": 779, "total_steps": 980, "loss": 0.0067, "lr": 1.239333509316281e-06, "epoch": 27.821428571428573, "percentage": 79.49, "elapsed_time": "0:53:11", "remaining_time": "0:13:43"}
{"current_steps": 780, "total_steps": 980, "loss": 0.0088, "lr": 1.2276207453959283e-06, "epoch": 27.857142857142858, "percentage": 79.59, "elapsed_time": "0:53:14", "remaining_time": "0:13:39"}
{"current_steps": 781, "total_steps": 980, "loss": 0.0082, "lr": 1.2159558420011907e-06, "epoch": 27.892857142857142, "percentage": 79.69, "elapsed_time": "0:53:18", "remaining_time": "0:13:34"}
{"current_steps": 782, "total_steps": 980, "loss": 0.0105, "lr": 1.2043389471257833e-06, "epoch": 27.928571428571427, "percentage": 79.8, "elapsed_time": "0:53:22", "remaining_time": "0:13:30"}
{"current_steps": 783, "total_steps": 980, "loss": 0.01, "lr": 1.1927702081543279e-06, "epoch": 27.964285714285715, "percentage": 79.9, "elapsed_time": "0:53:26", "remaining_time": "0:13:26"}
{"current_steps": 784, "total_steps": 980, "loss": 0.0082, "lr": 1.1812497718604887e-06, "epoch": 28.0, "percentage": 80.0, "elapsed_time": "0:53:29", "remaining_time": "0:13:22"}
{"current_steps": 785, "total_steps": 980, "loss": 0.0076, "lr": 1.1697777844051105e-06, "epoch": 28.035714285714285, "percentage": 80.1, "elapsed_time": "0:53:33", "remaining_time": "0:13:18"}
{"current_steps": 786, "total_steps": 980, "loss": 0.0082, "lr": 1.158354391334362e-06, "epoch": 28.071428571428573, "percentage": 80.2, "elapsed_time": "0:53:36", "remaining_time": "0:13:13"}
{"current_steps": 787, "total_steps": 980, "loss": 0.0083, "lr": 1.1469797375778902e-06, "epoch": 28.107142857142858, "percentage": 80.31, "elapsed_time": "0:53:40", "remaining_time": "0:13:09"}
{"current_steps": 788, "total_steps": 980, "loss": 0.0064, "lr": 1.1356539674469852e-06, "epoch": 28.142857142857142, "percentage": 80.41, "elapsed_time": "0:53:44", "remaining_time": "0:13:05"}
{"current_steps": 789, "total_steps": 980, "loss": 0.009, "lr": 1.1243772246327416e-06, "epoch": 28.178571428571427, "percentage": 80.51, "elapsed_time": "0:53:47", "remaining_time": "0:13:01"}
{"current_steps": 790, "total_steps": 980, "loss": 0.0109, "lr": 1.1131496522042424e-06, "epoch": 28.214285714285715, "percentage": 80.61, "elapsed_time": "0:53:51", "remaining_time": "0:12:57"}
{"current_steps": 791, "total_steps": 980, "loss": 0.0083, "lr": 1.1019713926067394e-06, "epoch": 28.25, "percentage": 80.71, "elapsed_time": "0:53:54", "remaining_time": "0:12:52"}
{"current_steps": 792, "total_steps": 980, "loss": 0.0091, "lr": 1.0908425876598512e-06, "epoch": 28.285714285714285, "percentage": 80.82, "elapsed_time": "0:53:59", "remaining_time": "0:12:48"}
{"current_steps": 793, "total_steps": 980, "loss": 0.0093, "lr": 1.0797633785557582e-06, "epoch": 28.321428571428573, "percentage": 80.92, "elapsed_time": "0:54:02", "remaining_time": "0:12:44"}
{"current_steps": 794, "total_steps": 980, "loss": 0.0057, "lr": 1.068733905857413e-06, "epoch": 28.357142857142858, "percentage": 81.02, "elapsed_time": "0:54:05", "remaining_time": "0:12:40"}
{"current_steps": 795, "total_steps": 980, "loss": 0.0063, "lr": 1.0577543094967613e-06, "epoch": 28.392857142857142, "percentage": 81.12, "elapsed_time": "0:54:10", "remaining_time": "0:12:36"}
{"current_steps": 796, "total_steps": 980, "loss": 0.0072, "lr": 1.0468247287729593e-06, "epoch": 28.428571428571427, "percentage": 81.22, "elapsed_time": "0:54:13", "remaining_time": "0:12:32"}
{"current_steps": 797, "total_steps": 980, "loss": 0.0116, "lr": 1.0359453023506123e-06, "epoch": 28.464285714285715, "percentage": 81.33, "elapsed_time": "0:54:17", "remaining_time": "0:12:27"}
{"current_steps": 798, "total_steps": 980, "loss": 0.0074, "lr": 1.0251161682580125e-06, "epoch": 28.5, "percentage": 81.43, "elapsed_time": "0:54:21", "remaining_time": "0:12:23"}
{"current_steps": 799, "total_steps": 980, "loss": 0.0099, "lr": 1.0143374638853892e-06, "epoch": 28.535714285714285, "percentage": 81.53, "elapsed_time": "0:54:24", "remaining_time": "0:12:19"}
{"current_steps": 800, "total_steps": 980, "loss": 0.0106, "lr": 1.0036093259831624e-06, "epoch": 28.571428571428573, "percentage": 81.63, "elapsed_time": "0:54:29", "remaining_time": "0:12:15"}
{"current_steps": 800, "total_steps": 980, "eval_loss": 2.567107677459717, "epoch": 28.571428571428573, "percentage": 81.63, "elapsed_time": "0:54:29", "remaining_time": "0:12:15"}
{"current_steps": 801, "total_steps": 980, "loss": 0.0088, "lr": 9.929318906602176e-07, "epoch": 28.607142857142858, "percentage": 81.73, "elapsed_time": "0:55:18", "remaining_time": "0:12:21"}
{"current_steps": 802, "total_steps": 980, "loss": 0.0067, "lr": 9.823052933821643e-07, "epoch": 28.642857142857142, "percentage": 81.84, "elapsed_time": "0:55:21", "remaining_time": "0:12:17"}
{"current_steps": 803, "total_steps": 980, "loss": 0.0081, "lr": 9.717296689696283e-07, "epoch": 28.678571428571427, "percentage": 81.94, "elapsed_time": "0:55:24", "remaining_time": "0:12:12"}
{"current_steps": 804, "total_steps": 980, "loss": 0.0069, "lr": 9.612051515965388e-07, "epoch": 28.714285714285715, "percentage": 82.04, "elapsed_time": "0:55:28", "remaining_time": "0:12:08"}
{"current_steps": 805, "total_steps": 980, "loss": 0.0107, "lr": 9.507318747884243e-07, "epoch": 28.75, "percentage": 82.14, "elapsed_time": "0:55:32", "remaining_time": "0:12:04"}
{"current_steps": 806, "total_steps": 980, "loss": 0.0137, "lr": 9.403099714207175e-07, "epoch": 28.785714285714285, "percentage": 82.24, "elapsed_time": "0:55:35", "remaining_time": "0:12:00"}
{"current_steps": 807, "total_steps": 980, "loss": 0.0096, "lr": 9.299395737170758e-07, "epoch": 28.821428571428573, "percentage": 82.35, "elapsed_time": "0:55:38", "remaining_time": "0:11:55"}
{"current_steps": 808, "total_steps": 980, "loss": 0.0068, "lr": 9.196208132476963e-07, "epoch": 28.857142857142858, "percentage": 82.45, "elapsed_time": "0:55:42", "remaining_time": "0:11:51"}
{"current_steps": 809, "total_steps": 980, "loss": 0.0074, "lr": 9.093538209276487e-07, "epoch": 28.892857142857142, "percentage": 82.55, "elapsed_time": "0:55:46", "remaining_time": "0:11:47"}
{"current_steps": 810, "total_steps": 980, "loss": 0.0105, "lr": 8.991387270152202e-07, "epoch": 28.928571428571427, "percentage": 82.65, "elapsed_time": "0:55:49", "remaining_time": "0:11:43"}
{"current_steps": 811, "total_steps": 980, "loss": 0.0079, "lr": 8.88975661110254e-07, "epoch": 28.964285714285715, "percentage": 82.76, "elapsed_time": "0:55:53", "remaining_time": "0:11:38"}
{"current_steps": 812, "total_steps": 980, "loss": 0.007, "lr": 8.78864752152509e-07, "epoch": 29.0, "percentage": 82.86, "elapsed_time": "0:55:56", "remaining_time": "0:11:34"}
{"current_steps": 813, "total_steps": 980, "loss": 0.0091, "lr": 8.688061284200266e-07, "epoch": 29.035714285714285, "percentage": 82.96, "elapsed_time": "0:55:59", "remaining_time": "0:11:30"}
{"current_steps": 814, "total_steps": 980, "loss": 0.0087, "lr": 8.587999175274986e-07, "epoch": 29.071428571428573, "percentage": 83.06, "elapsed_time": "0:56:03", "remaining_time": "0:11:25"}
{"current_steps": 815, "total_steps": 980, "loss": 0.0089, "lr": 8.488462464246495e-07, "epoch": 29.107142857142858, "percentage": 83.16, "elapsed_time": "0:56:06", "remaining_time": "0:11:21"}
{"current_steps": 816, "total_steps": 980, "loss": 0.0077, "lr": 8.389452413946314e-07, "epoch": 29.142857142857142, "percentage": 83.27, "elapsed_time": "0:56:11", "remaining_time": "0:11:17"}
{"current_steps": 817, "total_steps": 980, "loss": 0.0088, "lr": 8.290970280524124e-07, "epoch": 29.178571428571427, "percentage": 83.37, "elapsed_time": "0:56:15", "remaining_time": "0:11:13"}
{"current_steps": 818, "total_steps": 980, "loss": 0.0106, "lr": 8.193017313431872e-07, "epoch": 29.214285714285715, "percentage": 83.47, "elapsed_time": "0:56:18", "remaining_time": "0:11:09"}
{"current_steps": 819, "total_steps": 980, "loss": 0.0068, "lr": 8.095594755407971e-07, "epoch": 29.25, "percentage": 83.57, "elapsed_time": "0:56:21", "remaining_time": "0:11:04"}
{"current_steps": 820, "total_steps": 980, "loss": 0.0085, "lr": 7.99870384246143e-07, "epoch": 29.285714285714285, "percentage": 83.67, "elapsed_time": "0:56:26", "remaining_time": "0:11:00"}
{"current_steps": 821, "total_steps": 980, "loss": 0.0075, "lr": 7.902345803856265e-07, "epoch": 29.321428571428573, "percentage": 83.78, "elapsed_time": "0:56:29", "remaining_time": "0:10:56"}
{"current_steps": 822, "total_steps": 980, "loss": 0.0074, "lr": 7.806521862095834e-07, "epoch": 29.357142857142858, "percentage": 83.88, "elapsed_time": "0:56:33", "remaining_time": "0:10:52"}
{"current_steps": 823, "total_steps": 980, "loss": 0.0068, "lr": 7.711233232907401e-07, "epoch": 29.392857142857142, "percentage": 83.98, "elapsed_time": "0:56:36", "remaining_time": "0:10:47"}
{"current_steps": 824, "total_steps": 980, "loss": 0.0087, "lr": 7.616481125226632e-07, "epoch": 29.428571428571427, "percentage": 84.08, "elapsed_time": "0:56:39", "remaining_time": "0:10:43"}
{"current_steps": 825, "total_steps": 980, "loss": 0.0106, "lr": 7.522266741182305e-07, "epoch": 29.464285714285715, "percentage": 84.18, "elapsed_time": "0:56:43", "remaining_time": "0:10:39"}
{"current_steps": 826, "total_steps": 980, "loss": 0.0094, "lr": 7.42859127608106e-07, "epoch": 29.5, "percentage": 84.29, "elapsed_time": "0:56:47", "remaining_time": "0:10:35"}
{"current_steps": 827, "total_steps": 980, "loss": 0.0114, "lr": 7.33545591839222e-07, "epoch": 29.535714285714285, "percentage": 84.39, "elapsed_time": "0:56:51", "remaining_time": "0:10:31"}
{"current_steps": 828, "total_steps": 980, "loss": 0.0069, "lr": 7.242861849732696e-07, "epoch": 29.571428571428573, "percentage": 84.49, "elapsed_time": "0:56:55", "remaining_time": "0:10:26"}
{"current_steps": 829, "total_steps": 980, "loss": 0.0075, "lr": 7.150810244852036e-07, "epoch": 29.607142857142858, "percentage": 84.59, "elapsed_time": "0:56:59", "remaining_time": "0:10:22"}
{"current_steps": 830, "total_steps": 980, "loss": 0.0067, "lr": 7.059302271617485e-07, "epoch": 29.642857142857142, "percentage": 84.69, "elapsed_time": "0:57:02", "remaining_time": "0:10:18"}
{"current_steps": 831, "total_steps": 980, "loss": 0.0094, "lr": 6.968339090999188e-07, "epoch": 29.678571428571427, "percentage": 84.8, "elapsed_time": "0:57:06", "remaining_time": "0:10:14"}
{"current_steps": 832, "total_steps": 980, "loss": 0.0068, "lr": 6.877921857055476e-07, "epoch": 29.714285714285715, "percentage": 84.9, "elapsed_time": "0:57:10", "remaining_time": "0:10:10"}
{"current_steps": 833, "total_steps": 980, "loss": 0.009, "lr": 6.78805171691817e-07, "epoch": 29.75, "percentage": 85.0, "elapsed_time": "0:57:14", "remaining_time": "0:10:06"}
{"current_steps": 834, "total_steps": 980, "loss": 0.0088, "lr": 6.698729810778065e-07, "epoch": 29.785714285714285, "percentage": 85.1, "elapsed_time": "0:57:17", "remaining_time": "0:10:01"}
{"current_steps": 835, "total_steps": 980, "loss": 0.0087, "lr": 6.609957271870505e-07, "epoch": 29.821428571428573, "percentage": 85.2, "elapsed_time": "0:57:21", "remaining_time": "0:09:57"}
{"current_steps": 836, "total_steps": 980, "loss": 0.0065, "lr": 6.521735226460901e-07, "epoch": 29.857142857142858, "percentage": 85.31, "elapsed_time": "0:57:25", "remaining_time": "0:09:53"}
{"current_steps": 837, "total_steps": 980, "loss": 0.0107, "lr": 6.43406479383053e-07, "epoch": 29.892857142857142, "percentage": 85.41, "elapsed_time": "0:57:28", "remaining_time": "0:09:49"}
{"current_steps": 838, "total_steps": 980, "loss": 0.007, "lr": 6.346947086262323e-07, "epoch": 29.928571428571427, "percentage": 85.51, "elapsed_time": "0:57:32", "remaining_time": "0:09:44"}
{"current_steps": 839, "total_steps": 980, "loss": 0.0103, "lr": 6.260383209026704e-07, "epoch": 29.964285714285715, "percentage": 85.61, "elapsed_time": "0:57:35", "remaining_time": "0:09:40"}
{"current_steps": 840, "total_steps": 980, "loss": 0.0093, "lr": 6.174374260367611e-07, "epoch": 30.0, "percentage": 85.71, "elapsed_time": "0:57:38", "remaining_time": "0:09:36"}
{"current_steps": 841, "total_steps": 980, "loss": 0.0097, "lr": 6.088921331488568e-07, "epoch": 30.035714285714285, "percentage": 85.82, "elapsed_time": "0:57:42", "remaining_time": "0:09:32"}
{"current_steps": 842, "total_steps": 980, "loss": 0.0065, "lr": 6.004025506538813e-07, "epoch": 30.071428571428573, "percentage": 85.92, "elapsed_time": "0:57:46", "remaining_time": "0:09:28"}
{"current_steps": 843, "total_steps": 980, "loss": 0.008, "lr": 5.919687862599549e-07, "epoch": 30.107142857142858, "percentage": 86.02, "elapsed_time": "0:57:50", "remaining_time": "0:09:23"}
{"current_steps": 844, "total_steps": 980, "loss": 0.0091, "lr": 5.835909469670292e-07, "epoch": 30.142857142857142, "percentage": 86.12, "elapsed_time": "0:57:54", "remaining_time": "0:09:19"}
{"current_steps": 845, "total_steps": 980, "loss": 0.005, "lr": 5.752691390655279e-07, "epoch": 30.178571428571427, "percentage": 86.22, "elapsed_time": "0:57:57", "remaining_time": "0:09:15"}
{"current_steps": 846, "total_steps": 980, "loss": 0.008, "lr": 5.670034681349995e-07, "epoch": 30.214285714285715, "percentage": 86.33, "elapsed_time": "0:58:00", "remaining_time": "0:09:11"}
{"current_steps": 847, "total_steps": 980, "loss": 0.0068, "lr": 5.587940390427804e-07, "epoch": 30.25, "percentage": 86.43, "elapsed_time": "0:58:04", "remaining_time": "0:09:07"}
{"current_steps": 848, "total_steps": 980, "loss": 0.0101, "lr": 5.506409559426573e-07, "epoch": 30.285714285714285, "percentage": 86.53, "elapsed_time": "0:58:07", "remaining_time": "0:09:02"}
{"current_steps": 849, "total_steps": 980, "loss": 0.0078, "lr": 5.425443222735527e-07, "epoch": 30.321428571428573, "percentage": 86.63, "elapsed_time": "0:58:10", "remaining_time": "0:08:58"}
{"current_steps": 850, "total_steps": 980, "loss": 0.009, "lr": 5.345042407582079e-07, "epoch": 30.357142857142858, "percentage": 86.73, "elapsed_time": "0:58:13", "remaining_time": "0:08:54"}
{"current_steps": 851, "total_steps": 980, "loss": 0.0063, "lr": 5.265208134018851e-07, "epoch": 30.392857142857142, "percentage": 86.84, "elapsed_time": "0:58:17", "remaining_time": "0:08:50"}
{"current_steps": 852, "total_steps": 980, "loss": 0.0095, "lr": 5.185941414910673e-07, "epoch": 30.428571428571427, "percentage": 86.94, "elapsed_time": "0:58:22", "remaining_time": "0:08:46"}
{"current_steps": 853, "total_steps": 980, "loss": 0.008, "lr": 5.107243255921746e-07, "epoch": 30.464285714285715, "percentage": 87.04, "elapsed_time": "0:58:25", "remaining_time": "0:08:41"}
{"current_steps": 854, "total_steps": 980, "loss": 0.0081, "lr": 5.029114655502937e-07, "epoch": 30.5, "percentage": 87.14, "elapsed_time": "0:58:29", "remaining_time": "0:08:37"}
{"current_steps": 855, "total_steps": 980, "loss": 0.0092, "lr": 4.951556604879049e-07, "epoch": 30.535714285714285, "percentage": 87.24, "elapsed_time": "0:58:32", "remaining_time": "0:08:33"}
{"current_steps": 856, "total_steps": 980, "loss": 0.01, "lr": 4.874570088036252e-07, "epoch": 30.571428571428573, "percentage": 87.35, "elapsed_time": "0:58:36", "remaining_time": "0:08:29"}
{"current_steps": 857, "total_steps": 980, "loss": 0.0085, "lr": 4.798156081709638e-07, "epoch": 30.607142857142858, "percentage": 87.45, "elapsed_time": "0:58:39", "remaining_time": "0:08:25"}
{"current_steps": 858, "total_steps": 980, "loss": 0.0095, "lr": 4.722315555370793e-07, "epoch": 30.642857142857142, "percentage": 87.55, "elapsed_time": "0:58:42", "remaining_time": "0:08:20"}
{"current_steps": 859, "total_steps": 980, "loss": 0.0079, "lr": 4.647049471215498e-07, "epoch": 30.678571428571427, "percentage": 87.65, "elapsed_time": "0:58:46", "remaining_time": "0:08:16"}
{"current_steps": 860, "total_steps": 980, "loss": 0.0082, "lr": 4.5723587841515707e-07, "epoch": 30.714285714285715, "percentage": 87.76, "elapsed_time": "0:58:50", "remaining_time": "0:08:12"}
{"current_steps": 861, "total_steps": 980, "loss": 0.0088, "lr": 4.4982444417866753e-07, "epoch": 30.75, "percentage": 87.86, "elapsed_time": "0:58:54", "remaining_time": "0:08:08"}
{"current_steps": 862, "total_steps": 980, "loss": 0.0096, "lr": 4.4247073844163434e-07, "epoch": 30.785714285714285, "percentage": 87.96, "elapsed_time": "0:58:58", "remaining_time": "0:08:04"}
{"current_steps": 863, "total_steps": 980, "loss": 0.0086, "lr": 4.351748545012058e-07, "epoch": 30.821428571428573, "percentage": 88.06, "elapsed_time": "0:59:01", "remaining_time": "0:08:00"}
{"current_steps": 864, "total_steps": 980, "loss": 0.0096, "lr": 4.279368849209381e-07, "epoch": 30.857142857142858, "percentage": 88.16, "elapsed_time": "0:59:06", "remaining_time": "0:07:56"}
{"current_steps": 865, "total_steps": 980, "loss": 0.0085, "lr": 4.2075692152962145e-07, "epoch": 30.892857142857142, "percentage": 88.27, "elapsed_time": "0:59:09", "remaining_time": "0:07:51"}
{"current_steps": 866, "total_steps": 980, "loss": 0.0087, "lr": 4.136350554201196e-07, "epoch": 30.928571428571427, "percentage": 88.37, "elapsed_time": "0:59:12", "remaining_time": "0:07:47"}
{"current_steps": 867, "total_steps": 980, "loss": 0.0081, "lr": 4.0657137694820826e-07, "epoch": 30.964285714285715, "percentage": 88.47, "elapsed_time": "0:59:16", "remaining_time": "0:07:43"}
{"current_steps": 868, "total_steps": 980, "loss": 0.0089, "lr": 3.9956597573142966e-07, "epoch": 31.0, "percentage": 88.57, "elapsed_time": "0:59:19", "remaining_time": "0:07:39"}
{"current_steps": 869, "total_steps": 980, "loss": 0.0079, "lr": 3.9261894064796136e-07, "epoch": 31.035714285714285, "percentage": 88.67, "elapsed_time": "0:59:23", "remaining_time": "0:07:35"}
{"current_steps": 870, "total_steps": 980, "loss": 0.0073, "lr": 3.8573035983548167e-07, "epoch": 31.071428571428573, "percentage": 88.78, "elapsed_time": "0:59:27", "remaining_time": "0:07:31"}
{"current_steps": 871, "total_steps": 980, "loss": 0.0072, "lr": 3.789003206900538e-07, "epoch": 31.107142857142858, "percentage": 88.88, "elapsed_time": "0:59:30", "remaining_time": "0:07:26"}
{"current_steps": 872, "total_steps": 980, "loss": 0.0082, "lr": 3.7212890986501773e-07, "epoch": 31.142857142857142, "percentage": 88.98, "elapsed_time": "0:59:33", "remaining_time": "0:07:22"}
{"current_steps": 873, "total_steps": 980, "loss": 0.0107, "lr": 3.6541621326989183e-07, "epoch": 31.178571428571427, "percentage": 89.08, "elapsed_time": "0:59:37", "remaining_time": "0:07:18"}
{"current_steps": 874, "total_steps": 980, "loss": 0.0071, "lr": 3.5876231606927936e-07, "epoch": 31.214285714285715, "percentage": 89.18, "elapsed_time": "0:59:41", "remaining_time": "0:07:14"}
{"current_steps": 875, "total_steps": 980, "loss": 0.0085, "lr": 3.5216730268179346e-07, "epoch": 31.25, "percentage": 89.29, "elapsed_time": "0:59:44", "remaining_time": "0:07:10"}
{"current_steps": 876, "total_steps": 980, "loss": 0.0075, "lr": 3.4563125677897936e-07, "epoch": 31.285714285714285, "percentage": 89.39, "elapsed_time": "0:59:48", "remaining_time": "0:07:05"}
{"current_steps": 877, "total_steps": 980, "loss": 0.0077, "lr": 3.3915426128425744e-07, "epoch": 31.321428571428573, "percentage": 89.49, "elapsed_time": "0:59:51", "remaining_time": "0:07:01"}
{"current_steps": 878, "total_steps": 980, "loss": 0.007, "lr": 3.327363983718723e-07, "epoch": 31.357142857142858, "percentage": 89.59, "elapsed_time": "0:59:55", "remaining_time": "0:06:57"}
{"current_steps": 879, "total_steps": 980, "loss": 0.0106, "lr": 3.263777494658449e-07, "epoch": 31.392857142857142, "percentage": 89.69, "elapsed_time": "0:59:58", "remaining_time": "0:06:53"}
{"current_steps": 880, "total_steps": 980, "loss": 0.0091, "lr": 3.200783952389447e-07, "epoch": 31.428571428571427, "percentage": 89.8, "elapsed_time": "1:00:02", "remaining_time": "0:06:49"}
{"current_steps": 881, "total_steps": 980, "loss": 0.0083, "lr": 3.138384156116614e-07, "epoch": 31.464285714285715, "percentage": 89.9, "elapsed_time": "1:00:05", "remaining_time": "0:06:45"}
{"current_steps": 882, "total_steps": 980, "loss": 0.0083, "lr": 3.076578897511978e-07, "epoch": 31.5, "percentage": 90.0, "elapsed_time": "1:00:10", "remaining_time": "0:06:41"}
{"current_steps": 883, "total_steps": 980, "loss": 0.0093, "lr": 3.015368960704584e-07, "epoch": 31.535714285714285, "percentage": 90.1, "elapsed_time": "1:00:13", "remaining_time": "0:06:36"}
{"current_steps": 884, "total_steps": 980, "loss": 0.0107, "lr": 2.954755122270564e-07, "epoch": 31.571428571428573, "percentage": 90.2, "elapsed_time": "1:00:17", "remaining_time": "0:06:32"}
{"current_steps": 885, "total_steps": 980, "loss": 0.0094, "lr": 2.894738151223331e-07, "epoch": 31.607142857142858, "percentage": 90.31, "elapsed_time": "1:00:21", "remaining_time": "0:06:28"}
{"current_steps": 886, "total_steps": 980, "loss": 0.0054, "lr": 2.835318809003751e-07, "epoch": 31.642857142857142, "percentage": 90.41, "elapsed_time": "1:00:25", "remaining_time": "0:06:24"}
{"current_steps": 887, "total_steps": 980, "loss": 0.0071, "lr": 2.776497849470544e-07, "epoch": 31.678571428571427, "percentage": 90.51, "elapsed_time": "1:00:28", "remaining_time": "0:06:20"}
{"current_steps": 888, "total_steps": 980, "loss": 0.0069, "lr": 2.71827601889067e-07, "epoch": 31.714285714285715, "percentage": 90.61, "elapsed_time": "1:00:32", "remaining_time": "0:06:16"}
{"current_steps": 889, "total_steps": 980, "loss": 0.0079, "lr": 2.6606540559298956e-07, "epoch": 31.75, "percentage": 90.71, "elapsed_time": "1:00:35", "remaining_time": "0:06:12"}
{"current_steps": 890, "total_steps": 980, "loss": 0.0081, "lr": 2.6036326916434153e-07, "epoch": 31.785714285714285, "percentage": 90.82, "elapsed_time": "1:00:39", "remaining_time": "0:06:08"}
{"current_steps": 891, "total_steps": 980, "loss": 0.0067, "lr": 2.547212649466568e-07, "epoch": 31.821428571428573, "percentage": 90.92, "elapsed_time": "1:00:43", "remaining_time": "0:06:03"}
{"current_steps": 892, "total_steps": 980, "loss": 0.0084, "lr": 2.491394645205669e-07, "epoch": 31.857142857142858, "percentage": 91.02, "elapsed_time": "1:00:46", "remaining_time": "0:05:59"}
{"current_steps": 893, "total_steps": 980, "loss": 0.0079, "lr": 2.436179387028903e-07, "epoch": 31.892857142857142, "percentage": 91.12, "elapsed_time": "1:00:50", "remaining_time": "0:05:55"}
{"current_steps": 894, "total_steps": 980, "loss": 0.0088, "lr": 2.3815675754573885e-07, "epoch": 31.928571428571427, "percentage": 91.22, "elapsed_time": "1:00:53", "remaining_time": "0:05:51"}
{"current_steps": 895, "total_steps": 980, "loss": 0.0102, "lr": 2.3275599033562414e-07, "epoch": 31.964285714285715, "percentage": 91.33, "elapsed_time": "1:00:56", "remaining_time": "0:05:47"}
{"current_steps": 896, "total_steps": 980, "loss": 0.007, "lr": 2.274157055925802e-07, "epoch": 32.0, "percentage": 91.43, "elapsed_time": "1:01:00", "remaining_time": "0:05:43"}
{"current_steps": 897, "total_steps": 980, "loss": 0.0093, "lr": 2.2213597106929608e-07, "epoch": 32.035714285714285, "percentage": 91.53, "elapsed_time": "1:01:03", "remaining_time": "0:05:38"}
{"current_steps": 898, "total_steps": 980, "loss": 0.007, "lr": 2.1691685375025362e-07, "epoch": 32.07142857142857, "percentage": 91.63, "elapsed_time": "1:01:07", "remaining_time": "0:05:34"}
{"current_steps": 899, "total_steps": 980, "loss": 0.0079, "lr": 2.117584198508771e-07, "epoch": 32.107142857142854, "percentage": 91.73, "elapsed_time": "1:01:10", "remaining_time": "0:05:30"}
{"current_steps": 900, "total_steps": 980, "loss": 0.0086, "lr": 2.0666073481669714e-07, "epoch": 32.142857142857146, "percentage": 91.84, "elapsed_time": "1:01:14", "remaining_time": "0:05:26"}
{"current_steps": 900, "total_steps": 980, "eval_loss": 2.5882554054260254, "epoch": 32.142857142857146, "percentage": 91.84, "elapsed_time": "1:01:15", "remaining_time": "0:05:26"}
{"current_steps": 901, "total_steps": 980, "loss": 0.008, "lr": 2.016238633225165e-07, "epoch": 32.17857142857143, "percentage": 91.94, "elapsed_time": "1:02:05", "remaining_time": "0:05:26"}
{"current_steps": 902, "total_steps": 980, "loss": 0.008, "lr": 1.9664786927159064e-07, "epoch": 32.214285714285715, "percentage": 92.04, "elapsed_time": "1:02:08", "remaining_time": "0:05:22"}
{"current_steps": 903, "total_steps": 980, "loss": 0.01, "lr": 1.9173281579481896e-07, "epoch": 32.25, "percentage": 92.14, "elapsed_time": "1:02:13", "remaining_time": "0:05:18"}
{"current_steps": 904, "total_steps": 980, "loss": 0.0065, "lr": 1.8687876524993987e-07, "epoch": 32.285714285714285, "percentage": 92.24, "elapsed_time": "1:02:16", "remaining_time": "0:05:14"}
{"current_steps": 905, "total_steps": 980, "loss": 0.0072, "lr": 1.820857792207431e-07, "epoch": 32.32142857142857, "percentage": 92.35, "elapsed_time": "1:02:20", "remaining_time": "0:05:09"}
{"current_steps": 906, "total_steps": 980, "loss": 0.0105, "lr": 1.7735391851628814e-07, "epoch": 32.357142857142854, "percentage": 92.45, "elapsed_time": "1:02:24", "remaining_time": "0:05:05"}
{"current_steps": 907, "total_steps": 980, "loss": 0.0076, "lr": 1.7268324317012974e-07, "epoch": 32.392857142857146, "percentage": 92.55, "elapsed_time": "1:02:27", "remaining_time": "0:05:01"}
{"current_steps": 908, "total_steps": 980, "loss": 0.0069, "lr": 1.680738124395598e-07, "epoch": 32.42857142857143, "percentage": 92.65, "elapsed_time": "1:02:30", "remaining_time": "0:04:57"}
{"current_steps": 909, "total_steps": 980, "loss": 0.0063, "lr": 1.6352568480485277e-07, "epoch": 32.464285714285715, "percentage": 92.76, "elapsed_time": "1:02:33", "remaining_time": "0:04:53"}
{"current_steps": 910, "total_steps": 980, "loss": 0.0098, "lr": 1.5903891796852756e-07, "epoch": 32.5, "percentage": 92.86, "elapsed_time": "1:02:38", "remaining_time": "0:04:49"}
{"current_steps": 911, "total_steps": 980, "loss": 0.0068, "lr": 1.5461356885461077e-07, "epoch": 32.535714285714285, "percentage": 92.96, "elapsed_time": "1:02:41", "remaining_time": "0:04:44"}
{"current_steps": 912, "total_steps": 980, "loss": 0.0064, "lr": 1.5024969360791564e-07, "epoch": 32.57142857142857, "percentage": 93.06, "elapsed_time": "1:02:44", "remaining_time": "0:04:40"}
{"current_steps": 913, "total_steps": 980, "loss": 0.0075, "lr": 1.4594734759333484e-07, "epoch": 32.607142857142854, "percentage": 93.16, "elapsed_time": "1:02:47", "remaining_time": "0:04:36"}
{"current_steps": 914, "total_steps": 980, "loss": 0.008, "lr": 1.4170658539512993e-07, "epoch": 32.642857142857146, "percentage": 93.27, "elapsed_time": "1:02:52", "remaining_time": "0:04:32"}
{"current_steps": 915, "total_steps": 980, "loss": 0.0085, "lr": 1.375274608162447e-07, "epoch": 32.67857142857143, "percentage": 93.37, "elapsed_time": "1:02:55", "remaining_time": "0:04:28"}
{"current_steps": 916, "total_steps": 980, "loss": 0.0074, "lr": 1.3341002687762062e-07, "epoch": 32.714285714285715, "percentage": 93.47, "elapsed_time": "1:02:58", "remaining_time": "0:04:24"}
{"current_steps": 917, "total_steps": 980, "loss": 0.0082, "lr": 1.2935433581752365e-07, "epoch": 32.75, "percentage": 93.57, "elapsed_time": "1:03:01", "remaining_time": "0:04:19"}
{"current_steps": 918, "total_steps": 980, "loss": 0.008, "lr": 1.253604390908819e-07, "epoch": 32.785714285714285, "percentage": 93.67, "elapsed_time": "1:03:06", "remaining_time": "0:04:15"}
{"current_steps": 919, "total_steps": 980, "loss": 0.0097, "lr": 1.2142838736863562e-07, "epoch": 32.82142857142857, "percentage": 93.78, "elapsed_time": "1:03:09", "remaining_time": "0:04:11"}
{"current_steps": 920, "total_steps": 980, "loss": 0.0094, "lr": 1.175582305370887e-07, "epoch": 32.857142857142854, "percentage": 93.88, "elapsed_time": "1:03:12", "remaining_time": "0:04:07"}
{"current_steps": 921, "total_steps": 980, "loss": 0.0092, "lr": 1.1375001769728e-07, "epoch": 32.892857142857146, "percentage": 93.98, "elapsed_time": "1:03:17", "remaining_time": "0:04:03"}
{"current_steps": 922, "total_steps": 980, "loss": 0.0069, "lr": 1.1000379716435916e-07, "epoch": 32.92857142857143, "percentage": 94.08, "elapsed_time": "1:03:21", "remaining_time": "0:03:59"}
{"current_steps": 923, "total_steps": 980, "loss": 0.0101, "lr": 1.0631961646697387e-07, "epoch": 32.964285714285715, "percentage": 94.18, "elapsed_time": "1:03:24", "remaining_time": "0:03:54"}
{"current_steps": 924, "total_steps": 980, "loss": 0.009, "lr": 1.0269752234666642e-07, "epoch": 33.0, "percentage": 94.29, "elapsed_time": "1:03:27", "remaining_time": "0:03:50"}
{"current_steps": 925, "total_steps": 980, "loss": 0.0078, "lr": 9.913756075728088e-08, "epoch": 33.035714285714285, "percentage": 94.39, "elapsed_time": "1:03:32", "remaining_time": "0:03:46"}
{"current_steps": 926, "total_steps": 980, "loss": 0.0104, "lr": 9.563977686438019e-08, "epoch": 33.07142857142857, "percentage": 94.49, "elapsed_time": "1:03:35", "remaining_time": "0:03:42"}
{"current_steps": 927, "total_steps": 980, "loss": 0.0093, "lr": 9.22042150446728e-08, "epoch": 33.107142857142854, "percentage": 94.59, "elapsed_time": "1:03:39", "remaining_time": "0:03:38"}
{"current_steps": 928, "total_steps": 980, "loss": 0.0077, "lr": 8.883091888545136e-08, "epoch": 33.142857142857146, "percentage": 94.69, "elapsed_time": "1:03:42", "remaining_time": "0:03:34"}
{"current_steps": 929, "total_steps": 980, "loss": 0.0105, "lr": 8.551993118403656e-08, "epoch": 33.17857142857143, "percentage": 94.8, "elapsed_time": "1:03:45", "remaining_time": "0:03:30"}
{"current_steps": 930, "total_steps": 980, "loss": 0.0082, "lr": 8.227129394723643e-08, "epoch": 33.214285714285715, "percentage": 94.9, "elapsed_time": "1:03:49", "remaining_time": "0:03:25"}
{"current_steps": 931, "total_steps": 980, "loss": 0.0071, "lr": 7.908504839081343e-08, "epoch": 33.25, "percentage": 95.0, "elapsed_time": "1:03:53", "remaining_time": "0:03:21"}
{"current_steps": 932, "total_steps": 980, "loss": 0.007, "lr": 7.59612349389599e-08, "epoch": 33.285714285714285, "percentage": 95.1, "elapsed_time": "1:03:57", "remaining_time": "0:03:17"}
{"current_steps": 933, "total_steps": 980, "loss": 0.0062, "lr": 7.289989322378732e-08, "epoch": 33.32142857142857, "percentage": 95.2, "elapsed_time": "1:04:00", "remaining_time": "0:03:13"}
{"current_steps": 934, "total_steps": 980, "loss": 0.0077, "lr": 6.990106208482227e-08, "epoch": 33.357142857142854, "percentage": 95.31, "elapsed_time": "1:04:05", "remaining_time": "0:03:09"}
{"current_steps": 935, "total_steps": 980, "loss": 0.0095, "lr": 6.696477956851356e-08, "epoch": 33.392857142857146, "percentage": 95.41, "elapsed_time": "1:04:08", "remaining_time": "0:03:05"}
{"current_steps": 936, "total_steps": 980, "loss": 0.0109, "lr": 6.409108292774912e-08, "epoch": 33.42857142857143, "percentage": 95.51, "elapsed_time": "1:04:12", "remaining_time": "0:03:01"}
{"current_steps": 937, "total_steps": 980, "loss": 0.0083, "lr": 6.12800086213866e-08, "epoch": 33.464285714285715, "percentage": 95.61, "elapsed_time": "1:04:15", "remaining_time": "0:02:56"}
{"current_steps": 938, "total_steps": 980, "loss": 0.0078, "lr": 5.853159231378469e-08, "epoch": 33.5, "percentage": 95.71, "elapsed_time": "1:04:19", "remaining_time": "0:02:52"}
{"current_steps": 939, "total_steps": 980, "loss": 0.0104, "lr": 5.584586887435739e-08, "epoch": 33.535714285714285, "percentage": 95.82, "elapsed_time": "1:04:23", "remaining_time": "0:02:48"}
{"current_steps": 940, "total_steps": 980, "loss": 0.0055, "lr": 5.322287237712664e-08, "epoch": 33.57142857142857, "percentage": 95.92, "elapsed_time": "1:04:26", "remaining_time": "0:02:44"}
{"current_steps": 941, "total_steps": 980, "loss": 0.0087, "lr": 5.0662636100292094e-08, "epoch": 33.607142857142854, "percentage": 96.02, "elapsed_time": "1:04:31", "remaining_time": "0:02:40"}
{"current_steps": 942, "total_steps": 980, "loss": 0.0063, "lr": 4.8165192525809754e-08, "epoch": 33.642857142857146, "percentage": 96.12, "elapsed_time": "1:04:34", "remaining_time": "0:02:36"}
{"current_steps": 943, "total_steps": 980, "loss": 0.0072, "lr": 4.573057333897679e-08, "epoch": 33.67857142857143, "percentage": 96.22, "elapsed_time": "1:04:38", "remaining_time": "0:02:32"}
{"current_steps": 944, "total_steps": 980, "loss": 0.0088, "lr": 4.335880942803405e-08, "epoch": 33.714285714285715, "percentage": 96.33, "elapsed_time": "1:04:42", "remaining_time": "0:02:28"}
{"current_steps": 945, "total_steps": 980, "loss": 0.0081, "lr": 4.104993088376974e-08, "epoch": 33.75, "percentage": 96.43, "elapsed_time": "1:04:45", "remaining_time": "0:02:23"}
{"current_steps": 946, "total_steps": 980, "loss": 0.0059, "lr": 3.8803966999139686e-08, "epoch": 33.785714285714285, "percentage": 96.53, "elapsed_time": "1:04:49", "remaining_time": "0:02:19"}
{"current_steps": 947, "total_steps": 980, "loss": 0.0067, "lr": 3.662094626889656e-08, "epoch": 33.82142857142857, "percentage": 96.63, "elapsed_time": "1:04:52", "remaining_time": "0:02:15"}
{"current_steps": 948, "total_steps": 980, "loss": 0.008, "lr": 3.450089638922738e-08, "epoch": 33.857142857142854, "percentage": 96.73, "elapsed_time": "1:04:55", "remaining_time": "0:02:11"}
{"current_steps": 949, "total_steps": 980, "loss": 0.008, "lr": 3.2443844257400434e-08, "epoch": 33.892857142857146, "percentage": 96.84, "elapsed_time": "1:04:59", "remaining_time": "0:02:07"}
{"current_steps": 950, "total_steps": 980, "loss": 0.0096, "lr": 3.044981597142837e-08, "epoch": 33.92857142857143, "percentage": 96.94, "elapsed_time": "1:05:04", "remaining_time": "0:02:03"}
{"current_steps": 951, "total_steps": 980, "loss": 0.0081, "lr": 2.8518836829732332e-08, "epoch": 33.964285714285715, "percentage": 97.04, "elapsed_time": "1:05:07", "remaining_time": "0:01:59"}
{"current_steps": 952, "total_steps": 980, "loss": 0.0083, "lr": 2.6650931330823305e-08, "epoch": 34.0, "percentage": 97.14, "elapsed_time": "1:05:12", "remaining_time": "0:01:55"}
{"current_steps": 953, "total_steps": 980, "loss": 0.0086, "lr": 2.4846123172992953e-08, "epoch": 34.035714285714285, "percentage": 97.24, "elapsed_time": "1:05:16", "remaining_time": "0:01:50"}
{"current_steps": 954, "total_steps": 980, "loss": 0.0073, "lr": 2.3104435254008852e-08, "epoch": 34.07142857142857, "percentage": 97.35, "elapsed_time": "1:05:20", "remaining_time": "0:01:46"}
{"current_steps": 955, "total_steps": 980, "loss": 0.0053, "lr": 2.1425889670827483e-08, "epoch": 34.107142857142854, "percentage": 97.45, "elapsed_time": "1:05:24", "remaining_time": "0:01:42"}
{"current_steps": 956, "total_steps": 980, "loss": 0.007, "lr": 1.981050771931281e-08, "epoch": 34.142857142857146, "percentage": 97.55, "elapsed_time": "1:05:27", "remaining_time": "0:01:38"}
{"current_steps": 957, "total_steps": 980, "loss": 0.0087, "lr": 1.8258309893965375e-08, "epoch": 34.17857142857143, "percentage": 97.65, "elapsed_time": "1:05:31", "remaining_time": "0:01:34"}
{"current_steps": 958, "total_steps": 980, "loss": 0.0082, "lr": 1.6769315887662508e-08, "epoch": 34.214285714285715, "percentage": 97.76, "elapsed_time": "1:05:34", "remaining_time": "0:01:30"}
{"current_steps": 959, "total_steps": 980, "loss": 0.0088, "lr": 1.5343544591409632e-08, "epoch": 34.25, "percentage": 97.86, "elapsed_time": "1:05:38", "remaining_time": "0:01:26"}
{"current_steps": 960, "total_steps": 980, "loss": 0.0097, "lr": 1.3981014094099354e-08, "epoch": 34.285714285714285, "percentage": 97.96, "elapsed_time": "1:05:41", "remaining_time": "0:01:22"}
{"current_steps": 961, "total_steps": 980, "loss": 0.01, "lr": 1.2681741682282755e-08, "epoch": 34.32142857142857, "percentage": 98.06, "elapsed_time": "1:05:45", "remaining_time": "0:01:18"}
{"current_steps": 962, "total_steps": 980, "loss": 0.0096, "lr": 1.1445743839949008e-08, "epoch": 34.357142857142854, "percentage": 98.16, "elapsed_time": "1:05:49", "remaining_time": "0:01:13"}
{"current_steps": 963, "total_steps": 980, "loss": 0.0098, "lr": 1.0273036248318325e-08, "epoch": 34.392857142857146, "percentage": 98.27, "elapsed_time": "1:05:52", "remaining_time": "0:01:09"}
{"current_steps": 964, "total_steps": 980, "loss": 0.0084, "lr": 9.163633785639892e-09, "epoch": 34.42857142857143, "percentage": 98.37, "elapsed_time": "1:05:56", "remaining_time": "0:01:05"}
{"current_steps": 965, "total_steps": 980, "loss": 0.0089, "lr": 8.117550527005913e-09, "epoch": 34.464285714285715, "percentage": 98.47, "elapsed_time": "1:05:59", "remaining_time": "0:01:01"}
{"current_steps": 966, "total_steps": 980, "loss": 0.0073, "lr": 7.13479974417175e-09, "epoch": 34.5, "percentage": 98.57, "elapsed_time": "1:06:04", "remaining_time": "0:00:57"}
{"current_steps": 967, "total_steps": 980, "loss": 0.0083, "lr": 6.215393905388278e-09, "epoch": 34.535714285714285, "percentage": 98.67, "elapsed_time": "1:06:08", "remaining_time": "0:00:53"}
{"current_steps": 968, "total_steps": 980, "loss": 0.007, "lr": 5.359344675242018e-09, "epoch": 34.57142857142857, "percentage": 98.78, "elapsed_time": "1:06:12", "remaining_time": "0:00:49"}
{"current_steps": 969, "total_steps": 980, "loss": 0.0104, "lr": 4.56666291450858e-09, "epoch": 34.607142857142854, "percentage": 98.88, "elapsed_time": "1:06:15", "remaining_time": "0:00:45"}
{"current_steps": 970, "total_steps": 980, "loss": 0.0087, "lr": 3.837358680016112e-09, "epoch": 34.642857142857146, "percentage": 98.98, "elapsed_time": "1:06:19", "remaining_time": "0:00:41"}
{"current_steps": 971, "total_steps": 980, "loss": 0.0065, "lr": 3.1714412245148486e-09, "epoch": 34.67857142857143, "percentage": 99.08, "elapsed_time": "1:06:22", "remaining_time": "0:00:36"}
{"current_steps": 972, "total_steps": 980, "loss": 0.0088, "lr": 2.568918996560532e-09, "epoch": 34.714285714285715, "percentage": 99.18, "elapsed_time": "1:06:27", "remaining_time": "0:00:32"}
{"current_steps": 973, "total_steps": 980, "loss": 0.009, "lr": 2.029799640409502e-09, "epoch": 34.75, "percentage": 99.29, "elapsed_time": "1:06:31", "remaining_time": "0:00:28"}
{"current_steps": 974, "total_steps": 980, "loss": 0.0072, "lr": 1.5540899959187727e-09, "epoch": 34.785714285714285, "percentage": 99.39, "elapsed_time": "1:06:35", "remaining_time": "0:00:24"}
{"current_steps": 975, "total_steps": 980, "loss": 0.0056, "lr": 1.1417960984605459e-09, "epoch": 34.82142857142857, "percentage": 99.49, "elapsed_time": "1:06:38", "remaining_time": "0:00:20"}
{"current_steps": 976, "total_steps": 980, "loss": 0.0073, "lr": 7.92923178845606e-10, "epoch": 34.857142857142854, "percentage": 99.59, "elapsed_time": "1:06:41", "remaining_time": "0:00:16"}
{"current_steps": 977, "total_steps": 980, "loss": 0.0084, "lr": 5.07475663257262e-10, "epoch": 34.892857142857146, "percentage": 99.69, "elapsed_time": "1:06:45", "remaining_time": "0:00:12"}
{"current_steps": 978, "total_steps": 980, "loss": 0.0059, "lr": 2.854571731947253e-10, "epoch": 34.92857142857143, "percentage": 99.8, "elapsed_time": "1:06:48", "remaining_time": "0:00:08"}
{"current_steps": 979, "total_steps": 980, "loss": 0.008, "lr": 1.2687052542759148e-10, "epoch": 34.964285714285715, "percentage": 99.9, "elapsed_time": "1:06:52", "remaining_time": "0:00:04"}
{"current_steps": 980, "total_steps": 980, "loss": 0.0075, "lr": 3.171773195809191e-11, "epoch": 35.0, "percentage": 100.0, "elapsed_time": "1:06:56", "remaining_time": "0:00:00"}
{"current_steps": 980, "total_steps": 980, "epoch": 35.0, "percentage": 100.0, "elapsed_time": "1:07:40", "remaining_time": "0:00:00"}