Training in progress, step 1432
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4144e04a93cc1cc9597e0f6be4482dd4c3fdc977d05750ca5e75070a8a77b9f
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98f08b8b8aa161bb8e09372a0722bb2526bc2715118f6159f922607c9fde7233
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24df8ea9836da349bb165dfac07269c61919f32554fb1d80400e9e67141680f4
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87e8a73cb26cdb9e5f963b420d52b0d1af812374ff5808b2a9bac3b33e5b718d
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -1209,3 +1209,225 @@
|
|
1209 |
{"current_steps": 1209, "total_steps": 1432, "loss": 0.4699, "lr": 7.279029772675572e-07, "epoch": 1.6877470355731226, "percentage": 84.43, "elapsed_time": "2:44:31", "remaining_time": "0:30:20"}
|
1210 |
{"current_steps": 1210, "total_steps": 1432, "loss": 0.4537, "lr": 7.215790412887802e-07, "epoch": 1.6891420599860498, "percentage": 84.5, "elapsed_time": "2:44:38", "remaining_time": "0:30:12"}
|
1211 |
{"current_steps": 1211, "total_steps": 1432, "loss": 0.4089, "lr": 7.152805590332079e-07, "epoch": 1.690537084398977, "percentage": 84.57, "elapsed_time": "2:44:46", "remaining_time": "0:30:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1209 |
{"current_steps": 1209, "total_steps": 1432, "loss": 0.4699, "lr": 7.279029772675572e-07, "epoch": 1.6877470355731226, "percentage": 84.43, "elapsed_time": "2:44:31", "remaining_time": "0:30:20"}
|
1210 |
{"current_steps": 1210, "total_steps": 1432, "loss": 0.4537, "lr": 7.215790412887802e-07, "epoch": 1.6891420599860498, "percentage": 84.5, "elapsed_time": "2:44:38", "remaining_time": "0:30:12"}
|
1211 |
{"current_steps": 1211, "total_steps": 1432, "loss": 0.4089, "lr": 7.152805590332079e-07, "epoch": 1.690537084398977, "percentage": 84.57, "elapsed_time": "2:44:46", "remaining_time": "0:30:04"}
|
1212 |
+
{"current_steps": 1212, "total_steps": 1432, "loss": 0.4576, "lr": 7.090075679725683e-07, "epoch": 1.6919321088119044, "percentage": 84.64, "elapsed_time": "2:45:01", "remaining_time": "0:29:57"}
|
1213 |
+
{"current_steps": 1213, "total_steps": 1432, "loss": 0.4222, "lr": 7.027601054269329e-07, "epoch": 1.6933271332248314, "percentage": 84.71, "elapsed_time": "2:45:07", "remaining_time": "0:29:48"}
|
1214 |
+
{"current_steps": 1214, "total_steps": 1432, "loss": 0.4908, "lr": 6.965382085644968e-07, "epoch": 1.6947221576377587, "percentage": 84.78, "elapsed_time": "2:45:16", "remaining_time": "0:29:40"}
|
1215 |
+
{"current_steps": 1215, "total_steps": 1432, "loss": 0.4417, "lr": 6.903419144013556e-07, "epoch": 1.6961171820506857, "percentage": 84.85, "elapsed_time": "2:45:22", "remaining_time": "0:29:32"}
|
1216 |
+
{"current_steps": 1216, "total_steps": 1432, "loss": 0.408, "lr": 6.841712598012867e-07, "epoch": 1.697512206463613, "percentage": 84.92, "elapsed_time": "2:45:29", "remaining_time": "0:29:23"}
|
1217 |
+
{"current_steps": 1217, "total_steps": 1432, "loss": 0.4148, "lr": 6.780262814755284e-07, "epoch": 1.6989072308765403, "percentage": 84.99, "elapsed_time": "2:45:35", "remaining_time": "0:29:15"}
|
1218 |
+
{"current_steps": 1218, "total_steps": 1432, "loss": 0.4612, "lr": 6.719070159825642e-07, "epoch": 1.7003022552894675, "percentage": 85.06, "elapsed_time": "2:45:42", "remaining_time": "0:29:06"}
|
1219 |
+
{"current_steps": 1219, "total_steps": 1432, "loss": 0.5169, "lr": 6.65813499727902e-07, "epoch": 1.7016972797023948, "percentage": 85.13, "elapsed_time": "2:45:50", "remaining_time": "0:28:58"}
|
1220 |
+
{"current_steps": 1220, "total_steps": 1432, "loss": 0.4311, "lr": 6.597457689638598e-07, "epoch": 1.703092304115322, "percentage": 85.2, "elapsed_time": "2:45:59", "remaining_time": "0:28:50"}
|
1221 |
+
{"current_steps": 1221, "total_steps": 1432, "loss": 0.4401, "lr": 6.53703859789348e-07, "epoch": 1.7044873285282494, "percentage": 85.27, "elapsed_time": "2:46:06", "remaining_time": "0:28:42"}
|
1222 |
+
{"current_steps": 1222, "total_steps": 1432, "loss": 0.4084, "lr": 6.476878081496579e-07, "epoch": 1.7058823529411766, "percentage": 85.34, "elapsed_time": "2:46:13", "remaining_time": "0:28:33"}
|
1223 |
+
{"current_steps": 1223, "total_steps": 1432, "loss": 0.4444, "lr": 6.416976498362432e-07, "epoch": 1.7072773773541037, "percentage": 85.41, "elapsed_time": "2:46:20", "remaining_time": "0:28:25"}
|
1224 |
+
{"current_steps": 1224, "total_steps": 1432, "loss": 0.4296, "lr": 6.357334204865156e-07, "epoch": 1.708672401767031, "percentage": 85.47, "elapsed_time": "2:46:29", "remaining_time": "0:28:17"}
|
1225 |
+
{"current_steps": 1225, "total_steps": 1432, "loss": 0.4681, "lr": 6.29795155583619e-07, "epoch": 1.710067426179958, "percentage": 85.54, "elapsed_time": "2:46:35", "remaining_time": "0:28:09"}
|
1226 |
+
{"current_steps": 1226, "total_steps": 1432, "loss": 0.4148, "lr": 6.238828904562316e-07, "epoch": 1.7114624505928853, "percentage": 85.61, "elapsed_time": "2:46:42", "remaining_time": "0:28:00"}
|
1227 |
+
{"current_steps": 1227, "total_steps": 1432, "loss": 0.4311, "lr": 6.179966602783493e-07, "epoch": 1.7128574750058125, "percentage": 85.68, "elapsed_time": "2:46:50", "remaining_time": "0:27:52"}
|
1228 |
+
{"current_steps": 1228, "total_steps": 1432, "loss": 0.4598, "lr": 6.121365000690766e-07, "epoch": 1.7142524994187398, "percentage": 85.75, "elapsed_time": "2:46:57", "remaining_time": "0:27:44"}
|
1229 |
+
{"current_steps": 1229, "total_steps": 1432, "loss": 0.4421, "lr": 6.063024446924198e-07, "epoch": 1.715647523831667, "percentage": 85.82, "elapsed_time": "2:47:03", "remaining_time": "0:27:35"}
|
1230 |
+
{"current_steps": 1230, "total_steps": 1432, "loss": 0.4881, "lr": 6.004945288570813e-07, "epoch": 1.7170425482445943, "percentage": 85.89, "elapsed_time": "2:47:10", "remaining_time": "0:27:27"}
|
1231 |
+
{"current_steps": 1231, "total_steps": 1432, "loss": 0.4533, "lr": 5.947127871162455e-07, "epoch": 1.7184375726575216, "percentage": 85.96, "elapsed_time": "2:47:18", "remaining_time": "0:27:19"}
|
1232 |
+
{"current_steps": 1232, "total_steps": 1432, "loss": 0.4133, "lr": 5.889572538673826e-07, "epoch": 1.7198325970704489, "percentage": 86.03, "elapsed_time": "2:47:28", "remaining_time": "0:27:11"}
|
1233 |
+
{"current_steps": 1233, "total_steps": 1432, "loss": 0.4401, "lr": 5.832279633520411e-07, "epoch": 1.721227621483376, "percentage": 86.1, "elapsed_time": "2:47:34", "remaining_time": "0:27:02"}
|
1234 |
+
{"current_steps": 1234, "total_steps": 1432, "loss": 0.4857, "lr": 5.775249496556406e-07, "epoch": 1.7226226458963032, "percentage": 86.17, "elapsed_time": "2:47:42", "remaining_time": "0:26:54"}
|
1235 |
+
{"current_steps": 1235, "total_steps": 1432, "loss": 0.4431, "lr": 5.718482467072695e-07, "epoch": 1.7240176703092303, "percentage": 86.24, "elapsed_time": "2:47:51", "remaining_time": "0:26:46"}
|
1236 |
+
{"current_steps": 1236, "total_steps": 1432, "loss": 0.4292, "lr": 5.661978882794883e-07, "epoch": 1.7254126947221575, "percentage": 86.31, "elapsed_time": "2:48:00", "remaining_time": "0:26:38"}
|
1237 |
+
{"current_steps": 1237, "total_steps": 1432, "loss": 0.436, "lr": 5.60573907988124e-07, "epoch": 1.7268077191350848, "percentage": 86.38, "elapsed_time": "2:48:07", "remaining_time": "0:26:30"}
|
1238 |
+
{"current_steps": 1238, "total_steps": 1432, "loss": 0.4379, "lr": 5.54976339292072e-07, "epoch": 1.728202743548012, "percentage": 86.45, "elapsed_time": "2:48:16", "remaining_time": "0:26:22"}
|
1239 |
+
{"current_steps": 1239, "total_steps": 1432, "loss": 0.5001, "lr": 5.494052154930956e-07, "epoch": 1.7295977679609393, "percentage": 86.52, "elapsed_time": "2:48:25", "remaining_time": "0:26:14"}
|
1240 |
+
{"current_steps": 1240, "total_steps": 1432, "loss": 0.4067, "lr": 5.438605697356309e-07, "epoch": 1.7309927923738666, "percentage": 86.59, "elapsed_time": "2:48:33", "remaining_time": "0:26:06"}
|
1241 |
+
{"current_steps": 1241, "total_steps": 1432, "loss": 0.4641, "lr": 5.383424350065825e-07, "epoch": 1.7323878167867939, "percentage": 86.66, "elapsed_time": "2:48:42", "remaining_time": "0:25:57"}
|
1242 |
+
{"current_steps": 1242, "total_steps": 1432, "loss": 0.4055, "lr": 5.328508441351382e-07, "epoch": 1.7337828411997211, "percentage": 86.73, "elapsed_time": "2:48:49", "remaining_time": "0:25:49"}
|
1243 |
+
{"current_steps": 1243, "total_steps": 1432, "loss": 0.4874, "lr": 5.273858297925649e-07, "epoch": 1.7351778656126482, "percentage": 86.8, "elapsed_time": "2:48:58", "remaining_time": "0:25:41"}
|
1244 |
+
{"current_steps": 1244, "total_steps": 1432, "loss": 0.4354, "lr": 5.219474244920164e-07, "epoch": 1.7365728900255755, "percentage": 86.87, "elapsed_time": "2:49:04", "remaining_time": "0:25:33"}
|
1245 |
+
{"current_steps": 1245, "total_steps": 1432, "loss": 0.4151, "lr": 5.165356605883432e-07, "epoch": 1.7379679144385025, "percentage": 86.94, "elapsed_time": "2:49:10", "remaining_time": "0:25:24"}
|
1246 |
+
{"current_steps": 1246, "total_steps": 1432, "loss": 0.4411, "lr": 5.111505702778935e-07, "epoch": 1.7393629388514298, "percentage": 87.01, "elapsed_time": "2:49:16", "remaining_time": "0:25:16"}
|
1247 |
+
{"current_steps": 1247, "total_steps": 1432, "loss": 0.3942, "lr": 5.057921855983288e-07, "epoch": 1.740757963264357, "percentage": 87.08, "elapsed_time": "2:49:22", "remaining_time": "0:25:07"}
|
1248 |
+
{"current_steps": 1248, "total_steps": 1432, "loss": 0.4238, "lr": 5.004605384284295e-07, "epoch": 1.7421529876772843, "percentage": 87.15, "elapsed_time": "2:49:30", "remaining_time": "0:24:59"}
|
1249 |
+
{"current_steps": 1249, "total_steps": 1432, "loss": 0.4466, "lr": 4.951556604879049e-07, "epoch": 1.7435480120902116, "percentage": 87.22, "elapsed_time": "2:49:39", "remaining_time": "0:24:51"}
|
1250 |
+
{"current_steps": 1250, "total_steps": 1432, "loss": 0.43, "lr": 4.898775833372055e-07, "epoch": 1.7449430365031389, "percentage": 87.29, "elapsed_time": "2:49:51", "remaining_time": "0:24:43"}
|
1251 |
+
{"current_steps": 1251, "total_steps": 1432, "loss": 0.4687, "lr": 4.846263383773364e-07, "epoch": 1.7463380609160661, "percentage": 87.36, "elapsed_time": "2:49:59", "remaining_time": "0:24:35"}
|
1252 |
+
{"current_steps": 1252, "total_steps": 1432, "loss": 0.4575, "lr": 4.794019568496683e-07, "epoch": 1.7477330853289934, "percentage": 87.43, "elapsed_time": "2:50:05", "remaining_time": "0:24:27"}
|
1253 |
+
{"current_steps": 1253, "total_steps": 1432, "loss": 0.4148, "lr": 4.7420446983575286e-07, "epoch": 1.7491281097419205, "percentage": 87.5, "elapsed_time": "2:50:12", "remaining_time": "0:24:18"}
|
1254 |
+
{"current_steps": 1254, "total_steps": 1432, "loss": 0.4326, "lr": 4.690339082571366e-07, "epoch": 1.7505231341548477, "percentage": 87.57, "elapsed_time": "2:50:22", "remaining_time": "0:24:11"}
|
1255 |
+
{"current_steps": 1255, "total_steps": 1432, "loss": 0.4645, "lr": 4.638903028751796e-07, "epoch": 1.7519181585677748, "percentage": 87.64, "elapsed_time": "2:50:28", "remaining_time": "0:24:02"}
|
1256 |
+
{"current_steps": 1256, "total_steps": 1432, "loss": 0.3935, "lr": 4.5877368429086857e-07, "epoch": 1.753313182980702, "percentage": 87.71, "elapsed_time": "2:50:35", "remaining_time": "0:23:54"}
|
1257 |
+
{"current_steps": 1257, "total_steps": 1432, "loss": 0.4569, "lr": 4.5368408294463873e-07, "epoch": 1.7547082073936293, "percentage": 87.78, "elapsed_time": "2:50:45", "remaining_time": "0:23:46"}
|
1258 |
+
{"current_steps": 1258, "total_steps": 1432, "loss": 0.4907, "lr": 4.486215291161894e-07, "epoch": 1.7561032318065566, "percentage": 87.85, "elapsed_time": "2:50:56", "remaining_time": "0:23:38"}
|
1259 |
+
{"current_steps": 1259, "total_steps": 1432, "loss": 0.4436, "lr": 4.4358605292430743e-07, "epoch": 1.7574982562194839, "percentage": 87.92, "elapsed_time": "2:51:03", "remaining_time": "0:23:30"}
|
1260 |
+
{"current_steps": 1260, "total_steps": 1432, "loss": 0.4743, "lr": 4.385776843266842e-07, "epoch": 1.7588932806324111, "percentage": 87.99, "elapsed_time": "2:51:17", "remaining_time": "0:23:22"}
|
1261 |
+
{"current_steps": 1261, "total_steps": 1432, "loss": 0.4965, "lr": 4.335964531197401e-07, "epoch": 1.7602883050453384, "percentage": 88.06, "elapsed_time": "2:51:27", "remaining_time": "0:23:15"}
|
1262 |
+
{"current_steps": 1262, "total_steps": 1432, "loss": 0.4296, "lr": 4.286423889384456e-07, "epoch": 1.7616833294582657, "percentage": 88.13, "elapsed_time": "2:51:35", "remaining_time": "0:23:06"}
|
1263 |
+
{"current_steps": 1263, "total_steps": 1432, "loss": 0.4642, "lr": 4.2371552125614614e-07, "epoch": 1.7630783538711927, "percentage": 88.2, "elapsed_time": "2:51:44", "remaining_time": "0:22:58"}
|
1264 |
+
{"current_steps": 1264, "total_steps": 1432, "loss": 0.4555, "lr": 4.1881587938438606e-07, "epoch": 1.76447337828412, "percentage": 88.27, "elapsed_time": "2:51:56", "remaining_time": "0:22:51"}
|
1265 |
+
{"current_steps": 1265, "total_steps": 1432, "loss": 0.4449, "lr": 4.139434924727359e-07, "epoch": 1.765868402697047, "percentage": 88.34, "elapsed_time": "2:52:04", "remaining_time": "0:22:42"}
|
1266 |
+
{"current_steps": 1266, "total_steps": 1432, "loss": 0.4128, "lr": 4.090983895086137e-07, "epoch": 1.7672634271099743, "percentage": 88.41, "elapsed_time": "2:52:11", "remaining_time": "0:22:34"}
|
1267 |
+
{"current_steps": 1267, "total_steps": 1432, "loss": 0.4334, "lr": 4.0428059931712116e-07, "epoch": 1.7686584515229016, "percentage": 88.48, "elapsed_time": "2:52:18", "remaining_time": "0:22:26"}
|
1268 |
+
{"current_steps": 1268, "total_steps": 1432, "loss": 0.436, "lr": 3.994901505608628e-07, "epoch": 1.7700534759358288, "percentage": 88.55, "elapsed_time": "2:52:25", "remaining_time": "0:22:18"}
|
1269 |
+
{"current_steps": 1269, "total_steps": 1432, "loss": 0.4376, "lr": 3.94727071739785e-07, "epoch": 1.7714485003487561, "percentage": 88.62, "elapsed_time": "2:52:32", "remaining_time": "0:22:09"}
|
1270 |
+
{"current_steps": 1270, "total_steps": 1432, "loss": 0.4075, "lr": 3.899913911909986e-07, "epoch": 1.7728435247616834, "percentage": 88.69, "elapsed_time": "2:52:38", "remaining_time": "0:22:01"}
|
1271 |
+
{"current_steps": 1271, "total_steps": 1432, "loss": 0.4488, "lr": 3.8528313708861173e-07, "epoch": 1.7742385491746107, "percentage": 88.76, "elapsed_time": "2:52:45", "remaining_time": "0:21:52"}
|
1272 |
+
{"current_steps": 1272, "total_steps": 1432, "loss": 0.461, "lr": 3.8060233744356634e-07, "epoch": 1.775633573587538, "percentage": 88.83, "elapsed_time": "2:52:51", "remaining_time": "0:21:44"}
|
1273 |
+
{"current_steps": 1273, "total_steps": 1432, "loss": 0.4508, "lr": 3.759490201034677e-07, "epoch": 1.777028598000465, "percentage": 88.9, "elapsed_time": "2:53:02", "remaining_time": "0:21:36"}
|
1274 |
+
{"current_steps": 1274, "total_steps": 1432, "loss": 0.453, "lr": 3.7132321275241966e-07, "epoch": 1.7784236224133922, "percentage": 88.97, "elapsed_time": "2:53:08", "remaining_time": "0:21:28"}
|
1275 |
+
{"current_steps": 1275, "total_steps": 1432, "loss": 0.4554, "lr": 3.6672494291086156e-07, "epoch": 1.7798186468263193, "percentage": 89.04, "elapsed_time": "2:53:15", "remaining_time": "0:21:20"}
|
1276 |
+
{"current_steps": 1276, "total_steps": 1432, "loss": 0.4386, "lr": 3.6215423793540036e-07, "epoch": 1.7812136712392466, "percentage": 89.11, "elapsed_time": "2:53:22", "remaining_time": "0:21:11"}
|
1277 |
+
{"current_steps": 1277, "total_steps": 1432, "loss": 0.4894, "lr": 3.576111250186526e-07, "epoch": 1.7826086956521738, "percentage": 89.18, "elapsed_time": "2:53:31", "remaining_time": "0:21:03"}
|
1278 |
+
{"current_steps": 1278, "total_steps": 1432, "loss": 0.4553, "lr": 3.530956311890815e-07, "epoch": 1.784003720065101, "percentage": 89.25, "elapsed_time": "2:53:40", "remaining_time": "0:20:55"}
|
1279 |
+
{"current_steps": 1279, "total_steps": 1432, "loss": 0.414, "lr": 3.486077833108342e-07, "epoch": 1.7853987444780284, "percentage": 89.32, "elapsed_time": "2:53:46", "remaining_time": "0:20:47"}
|
1280 |
+
{"current_steps": 1280, "total_steps": 1432, "loss": 0.4794, "lr": 3.441476080835826e-07, "epoch": 1.7867937688909556, "percentage": 89.39, "elapsed_time": "2:53:53", "remaining_time": "0:20:38"}
|
1281 |
+
{"current_steps": 1281, "total_steps": 1432, "loss": 0.4163, "lr": 3.397151320423647e-07, "epoch": 1.788188793303883, "percentage": 89.46, "elapsed_time": "2:53:59", "remaining_time": "0:20:30"}
|
1282 |
+
{"current_steps": 1282, "total_steps": 1432, "loss": 0.4323, "lr": 3.353103815574282e-07, "epoch": 1.7895838177168102, "percentage": 89.53, "elapsed_time": "2:54:06", "remaining_time": "0:20:22"}
|
1283 |
+
{"current_steps": 1283, "total_steps": 1432, "loss": 0.4629, "lr": 3.309333828340722e-07, "epoch": 1.7909788421297372, "percentage": 89.59, "elapsed_time": "2:54:15", "remaining_time": "0:20:14"}
|
1284 |
+
{"current_steps": 1284, "total_steps": 1432, "loss": 0.4476, "lr": 3.2658416191249045e-07, "epoch": 1.7923738665426645, "percentage": 89.66, "elapsed_time": "2:54:21", "remaining_time": "0:20:05"}
|
1285 |
+
{"current_steps": 1285, "total_steps": 1432, "loss": 0.4355, "lr": 3.2226274466761906e-07, "epoch": 1.7937688909555918, "percentage": 89.73, "elapsed_time": "2:54:29", "remaining_time": "0:19:57"}
|
1286 |
+
{"current_steps": 1286, "total_steps": 1432, "loss": 0.4844, "lr": 3.179691568089799e-07, "epoch": 1.7951639153685188, "percentage": 89.8, "elapsed_time": "2:54:38", "remaining_time": "0:19:49"}
|
1287 |
+
{"current_steps": 1287, "total_steps": 1432, "loss": 0.4641, "lr": 3.137034238805292e-07, "epoch": 1.796558939781446, "percentage": 89.87, "elapsed_time": "2:54:48", "remaining_time": "0:19:41"}
|
1288 |
+
{"current_steps": 1288, "total_steps": 1432, "loss": 0.4353, "lr": 3.0946557126050435e-07, "epoch": 1.7979539641943734, "percentage": 89.94, "elapsed_time": "2:54:55", "remaining_time": "0:19:33"}
|
1289 |
+
{"current_steps": 1289, "total_steps": 1432, "loss": 0.4474, "lr": 3.0525562416127473e-07, "epoch": 1.7993489886073006, "percentage": 90.01, "elapsed_time": "2:55:02", "remaining_time": "0:19:25"}
|
1290 |
+
{"current_steps": 1290, "total_steps": 1432, "loss": 0.3931, "lr": 3.010736076291909e-07, "epoch": 1.800744013020228, "percentage": 90.08, "elapsed_time": "2:55:08", "remaining_time": "0:19:16"}
|
1291 |
+
{"current_steps": 1291, "total_steps": 1432, "loss": 0.4305, "lr": 2.9691954654443353e-07, "epoch": 1.8021390374331552, "percentage": 90.15, "elapsed_time": "2:55:15", "remaining_time": "0:19:08"}
|
1292 |
+
{"current_steps": 1292, "total_steps": 1432, "loss": 0.4049, "lr": 2.927934656208681e-07, "epoch": 1.8035340618460824, "percentage": 90.22, "elapsed_time": "2:55:23", "remaining_time": "0:19:00"}
|
1293 |
+
{"current_steps": 1293, "total_steps": 1432, "loss": 0.4269, "lr": 2.88695389405898e-07, "epoch": 1.8049290862590095, "percentage": 90.29, "elapsed_time": "2:55:30", "remaining_time": "0:18:52"}
|
1294 |
+
{"current_steps": 1294, "total_steps": 1432, "loss": 0.4754, "lr": 2.8462534228031636e-07, "epoch": 1.8063241106719368, "percentage": 90.36, "elapsed_time": "2:55:41", "remaining_time": "0:18:44"}
|
1295 |
+
{"current_steps": 1295, "total_steps": 1432, "loss": 0.5274, "lr": 2.8058334845816214e-07, "epoch": 1.807719135084864, "percentage": 90.43, "elapsed_time": "2:55:49", "remaining_time": "0:18:36"}
|
1296 |
+
{"current_steps": 1296, "total_steps": 1432, "loss": 0.4648, "lr": 2.765694319865775e-07, "epoch": 1.809114159497791, "percentage": 90.5, "elapsed_time": "2:55:56", "remaining_time": "0:18:27"}
|
1297 |
+
{"current_steps": 1297, "total_steps": 1432, "loss": 0.4601, "lr": 2.725836167456608e-07, "epoch": 1.8105091839107184, "percentage": 90.57, "elapsed_time": "2:56:02", "remaining_time": "0:18:19"}
|
1298 |
+
{"current_steps": 1298, "total_steps": 1432, "loss": 0.385, "lr": 2.6862592644832875e-07, "epoch": 1.8119042083236456, "percentage": 90.64, "elapsed_time": "2:56:09", "remaining_time": "0:18:11"}
|
1299 |
+
{"current_steps": 1299, "total_steps": 1432, "loss": 0.451, "lr": 2.646963846401729e-07, "epoch": 1.813299232736573, "percentage": 90.71, "elapsed_time": "2:56:15", "remaining_time": "0:18:02"}
|
1300 |
+
{"current_steps": 1300, "total_steps": 1432, "loss": 0.4129, "lr": 2.6079501469932154e-07, "epoch": 1.8146942571495002, "percentage": 90.78, "elapsed_time": "2:56:23", "remaining_time": "0:17:54"}
|
1301 |
+
{"current_steps": 1301, "total_steps": 1432, "loss": 0.4314, "lr": 2.569218398362971e-07, "epoch": 1.8160892815624274, "percentage": 90.85, "elapsed_time": "2:56:32", "remaining_time": "0:17:46"}
|
1302 |
+
{"current_steps": 1302, "total_steps": 1432, "loss": 0.4533, "lr": 2.530768830938818e-07, "epoch": 1.8174843059753547, "percentage": 90.92, "elapsed_time": "2:56:40", "remaining_time": "0:17:38"}
|
1303 |
+
{"current_steps": 1303, "total_steps": 1432, "loss": 0.3923, "lr": 2.49260167346978e-07, "epoch": 1.8188793303882818, "percentage": 90.99, "elapsed_time": "2:56:46", "remaining_time": "0:17:30"}
|
1304 |
+
{"current_steps": 1304, "total_steps": 1432, "loss": 0.4466, "lr": 2.4547171530247437e-07, "epoch": 1.820274354801209, "percentage": 91.06, "elapsed_time": "2:56:55", "remaining_time": "0:17:21"}
|
1305 |
+
{"current_steps": 1305, "total_steps": 1432, "loss": 0.4087, "lr": 2.417115494991107e-07, "epoch": 1.8216693792141363, "percentage": 91.13, "elapsed_time": "2:57:02", "remaining_time": "0:17:13"}
|
1306 |
+
{"current_steps": 1306, "total_steps": 1432, "loss": 0.4821, "lr": 2.3797969230733853e-07, "epoch": 1.8230644036270633, "percentage": 91.2, "elapsed_time": "2:57:16", "remaining_time": "0:17:06"}
|
1307 |
+
{"current_steps": 1307, "total_steps": 1432, "loss": 0.5061, "lr": 2.3427616592919587e-07, "epoch": 1.8244594280399906, "percentage": 91.27, "elapsed_time": "2:57:31", "remaining_time": "0:16:58"}
|
1308 |
+
{"current_steps": 1308, "total_steps": 1432, "loss": 0.4408, "lr": 2.3060099239817059e-07, "epoch": 1.8258544524529179, "percentage": 91.34, "elapsed_time": "2:57:40", "remaining_time": "0:16:50"}
|
1309 |
+
{"current_steps": 1309, "total_steps": 1432, "loss": 0.443, "lr": 2.2695419357906978e-07, "epoch": 1.8272494768658452, "percentage": 91.41, "elapsed_time": "2:57:47", "remaining_time": "0:16:42"}
|
1310 |
+
{"current_steps": 1310, "total_steps": 1432, "loss": 0.4114, "lr": 2.2333579116788962e-07, "epoch": 1.8286445012787724, "percentage": 91.48, "elapsed_time": "2:57:55", "remaining_time": "0:16:34"}
|
1311 |
+
{"current_steps": 1311, "total_steps": 1432, "loss": 0.483, "lr": 2.197458066916891e-07, "epoch": 1.8300395256916997, "percentage": 91.55, "elapsed_time": "2:58:03", "remaining_time": "0:16:26"}
|
1312 |
+
{"current_steps": 1312, "total_steps": 1432, "loss": 0.442, "lr": 2.161842615084564e-07, "epoch": 1.831434550104627, "percentage": 91.62, "elapsed_time": "2:58:09", "remaining_time": "0:16:17"}
|
1313 |
+
{"current_steps": 1313, "total_steps": 1432, "loss": 0.4395, "lr": 2.1265117680698665e-07, "epoch": 1.832829574517554, "percentage": 91.69, "elapsed_time": "2:58:17", "remaining_time": "0:16:09"}
|
1314 |
+
{"current_steps": 1314, "total_steps": 1432, "loss": 0.4567, "lr": 2.0914657360675606e-07, "epoch": 1.8342245989304813, "percentage": 91.76, "elapsed_time": "2:58:23", "remaining_time": "0:16:01"}
|
1315 |
+
{"current_steps": 1315, "total_steps": 1432, "loss": 0.4169, "lr": 2.0567047275779184e-07, "epoch": 1.8356196233434086, "percentage": 91.83, "elapsed_time": "2:58:33", "remaining_time": "0:15:53"}
|
1316 |
+
{"current_steps": 1316, "total_steps": 1432, "loss": 0.4349, "lr": 2.0222289494055357e-07, "epoch": 1.8370146477563356, "percentage": 91.9, "elapsed_time": "2:58:43", "remaining_time": "0:15:45"}
|
1317 |
+
{"current_steps": 1317, "total_steps": 1432, "loss": 0.4603, "lr": 1.988038606658066e-07, "epoch": 1.8384096721692629, "percentage": 91.97, "elapsed_time": "2:58:50", "remaining_time": "0:15:36"}
|
1318 |
+
{"current_steps": 1318, "total_steps": 1432, "loss": 0.4345, "lr": 1.9541339027450256e-07, "epoch": 1.8398046965821901, "percentage": 92.04, "elapsed_time": "2:58:58", "remaining_time": "0:15:28"}
|
1319 |
+
{"current_steps": 1319, "total_steps": 1432, "loss": 0.4481, "lr": 1.9205150393765692e-07, "epoch": 1.8411997209951174, "percentage": 92.11, "elapsed_time": "2:59:06", "remaining_time": "0:15:20"}
|
1320 |
+
{"current_steps": 1320, "total_steps": 1432, "loss": 0.4643, "lr": 1.887182216562289e-07, "epoch": 1.8425947454080447, "percentage": 92.18, "elapsed_time": "2:59:17", "remaining_time": "0:15:12"}
|
1321 |
+
{"current_steps": 1321, "total_steps": 1432, "loss": 0.4577, "lr": 1.8541356326100436e-07, "epoch": 1.843989769820972, "percentage": 92.25, "elapsed_time": "2:59:24", "remaining_time": "0:15:04"}
|
1322 |
+
{"current_steps": 1322, "total_steps": 1432, "loss": 0.4779, "lr": 1.821375484124721e-07, "epoch": 1.8453847942338992, "percentage": 92.32, "elapsed_time": "2:59:30", "remaining_time": "0:14:56"}
|
1323 |
+
{"current_steps": 1323, "total_steps": 1432, "loss": 0.449, "lr": 1.7889019660071728e-07, "epoch": 1.8467798186468263, "percentage": 92.39, "elapsed_time": "2:59:36", "remaining_time": "0:14:47"}
|
1324 |
+
{"current_steps": 1324, "total_steps": 1432, "loss": 0.4373, "lr": 1.7567152714529468e-07, "epoch": 1.8481748430597535, "percentage": 92.46, "elapsed_time": "2:59:44", "remaining_time": "0:14:39"}
|
1325 |
+
{"current_steps": 1325, "total_steps": 1432, "loss": 0.4246, "lr": 1.7248155919512067e-07, "epoch": 1.8495698674726808, "percentage": 92.53, "elapsed_time": "2:59:53", "remaining_time": "0:14:31"}
|
1326 |
+
{"current_steps": 1326, "total_steps": 1432, "loss": 0.4932, "lr": 1.693203117283543e-07, "epoch": 1.8509648918856079, "percentage": 92.6, "elapsed_time": "3:00:01", "remaining_time": "0:14:23"}
|
1327 |
+
{"current_steps": 1327, "total_steps": 1432, "loss": 0.4591, "lr": 1.6618780355229069e-07, "epoch": 1.8523599162985351, "percentage": 92.67, "elapsed_time": "3:00:11", "remaining_time": "0:14:15"}
|
1328 |
+
{"current_steps": 1328, "total_steps": 1432, "loss": 0.4462, "lr": 1.6308405330324294e-07, "epoch": 1.8537549407114624, "percentage": 92.74, "elapsed_time": "3:00:17", "remaining_time": "0:14:07"}
|
1329 |
+
{"current_steps": 1329, "total_steps": 1432, "loss": 0.4401, "lr": 1.6000907944643428e-07, "epoch": 1.8551499651243897, "percentage": 92.81, "elapsed_time": "3:00:27", "remaining_time": "0:13:59"}
|
1330 |
+
{"current_steps": 1330, "total_steps": 1432, "loss": 0.4671, "lr": 1.5696290027588933e-07, "epoch": 1.856544989537317, "percentage": 92.88, "elapsed_time": "3:00:33", "remaining_time": "0:13:50"}
|
1331 |
+
{"current_steps": 1331, "total_steps": 1432, "loss": 0.4419, "lr": 1.5394553391432142e-07, "epoch": 1.8579400139502442, "percentage": 92.95, "elapsed_time": "3:00:39", "remaining_time": "0:13:42"}
|
1332 |
+
{"current_steps": 1332, "total_steps": 1432, "loss": 0.4559, "lr": 1.5095699831302935e-07, "epoch": 1.8593350383631715, "percentage": 93.02, "elapsed_time": "3:00:46", "remaining_time": "0:13:34"}
|
1333 |
+
{"current_steps": 1333, "total_steps": 1432, "loss": 0.3962, "lr": 1.479973112517863e-07, "epoch": 1.8607300627760985, "percentage": 93.09, "elapsed_time": "3:00:54", "remaining_time": "0:13:26"}
|
1334 |
+
{"current_steps": 1334, "total_steps": 1432, "loss": 0.4032, "lr": 1.450664903387372e-07, "epoch": 1.8621250871890258, "percentage": 93.16, "elapsed_time": "3:01:00", "remaining_time": "0:13:17"}
|
1335 |
+
{"current_steps": 1335, "total_steps": 1432, "loss": 0.4072, "lr": 1.4216455301029274e-07, "epoch": 1.863520111601953, "percentage": 93.23, "elapsed_time": "3:01:10", "remaining_time": "0:13:09"}
|
1336 |
+
{"current_steps": 1336, "total_steps": 1432, "loss": 0.4359, "lr": 1.3929151653102546e-07, "epoch": 1.8649151360148801, "percentage": 93.3, "elapsed_time": "3:01:17", "remaining_time": "0:13:01"}
|
1337 |
+
{"current_steps": 1337, "total_steps": 1432, "loss": 0.4028, "lr": 1.3644739799356765e-07, "epoch": 1.8663101604278074, "percentage": 93.37, "elapsed_time": "3:01:23", "remaining_time": "0:12:53"}
|
1338 |
+
{"current_steps": 1338, "total_steps": 1432, "loss": 0.4239, "lr": 1.3363221431850816e-07, "epoch": 1.8677051848407347, "percentage": 93.44, "elapsed_time": "3:01:31", "remaining_time": "0:12:45"}
|
1339 |
+
{"current_steps": 1339, "total_steps": 1432, "loss": 0.4067, "lr": 1.308459822542951e-07, "epoch": 1.869100209253662, "percentage": 93.51, "elapsed_time": "3:01:39", "remaining_time": "0:12:37"}
|
1340 |
+
{"current_steps": 1340, "total_steps": 1432, "loss": 0.4981, "lr": 1.2808871837713177e-07, "epoch": 1.8704952336665892, "percentage": 93.58, "elapsed_time": "3:01:47", "remaining_time": "0:12:28"}
|
1341 |
+
{"current_steps": 1341, "total_steps": 1432, "loss": 0.4133, "lr": 1.253604390908819e-07, "epoch": 1.8718902580795165, "percentage": 93.65, "elapsed_time": "3:01:53", "remaining_time": "0:12:20"}
|
1342 |
+
{"current_steps": 1342, "total_steps": 1432, "loss": 0.4306, "lr": 1.2266116062696954e-07, "epoch": 1.8732852824924437, "percentage": 93.72, "elapsed_time": "3:02:00", "remaining_time": "0:12:12"}
|
1343 |
+
{"current_steps": 1343, "total_steps": 1432, "loss": 0.4544, "lr": 1.1999089904428385e-07, "epoch": 1.8746803069053708, "percentage": 93.78, "elapsed_time": "3:02:08", "remaining_time": "0:12:04"}
|
1344 |
+
{"current_steps": 1344, "total_steps": 1432, "loss": 0.3989, "lr": 1.1734967022908217e-07, "epoch": 1.876075331318298, "percentage": 93.85, "elapsed_time": "3:02:15", "remaining_time": "0:11:55"}
|
1345 |
+
{"current_steps": 1345, "total_steps": 1432, "loss": 0.407, "lr": 1.1473748989489775e-07, "epoch": 1.8774703557312253, "percentage": 93.92, "elapsed_time": "3:02:25", "remaining_time": "0:11:47"}
|
1346 |
+
{"current_steps": 1346, "total_steps": 1432, "loss": 0.4283, "lr": 1.121543735824443e-07, "epoch": 1.8788653801441524, "percentage": 93.99, "elapsed_time": "3:02:35", "remaining_time": "0:11:39"}
|
1347 |
+
{"current_steps": 1347, "total_steps": 1432, "loss": 0.46, "lr": 1.096003366595233e-07, "epoch": 1.8802604045570797, "percentage": 94.06, "elapsed_time": "3:02:41", "remaining_time": "0:11:31"}
|
1348 |
+
{"current_steps": 1348, "total_steps": 1432, "loss": 0.4333, "lr": 1.0707539432093517e-07, "epoch": 1.881655428970007, "percentage": 94.13, "elapsed_time": "3:02:48", "remaining_time": "0:11:23"}
|
1349 |
+
{"current_steps": 1349, "total_steps": 1432, "loss": 0.4215, "lr": 1.0457956158838545e-07, "epoch": 1.8830504533829342, "percentage": 94.2, "elapsed_time": "3:02:58", "remaining_time": "0:11:15"}
|
1350 |
+
{"current_steps": 1350, "total_steps": 1432, "loss": 0.4667, "lr": 1.0211285331039933e-07, "epoch": 1.8844454777958615, "percentage": 94.27, "elapsed_time": "3:03:07", "remaining_time": "0:11:07"}
|
1351 |
+
{"current_steps": 1351, "total_steps": 1432, "loss": 0.4549, "lr": 9.967528416222838e-08, "epoch": 1.8858405022087887, "percentage": 94.34, "elapsed_time": "3:03:16", "remaining_time": "0:10:59"}
|
1352 |
+
{"current_steps": 1352, "total_steps": 1432, "loss": 0.4569, "lr": 9.72668686457684e-08, "epoch": 1.887235526621716, "percentage": 94.41, "elapsed_time": "3:03:23", "remaining_time": "0:10:51"}
|
1353 |
+
{"current_steps": 1353, "total_steps": 1432, "loss": 0.3936, "lr": 9.488762108946891e-08, "epoch": 1.888630551034643, "percentage": 94.48, "elapsed_time": "3:03:30", "remaining_time": "0:10:42"}
|
1354 |
+
{"current_steps": 1354, "total_steps": 1432, "loss": 0.4036, "lr": 9.25375556482505e-08, "epoch": 1.8900255754475703, "percentage": 94.55, "elapsed_time": "3:03:36", "remaining_time": "0:10:34"}
|
1355 |
+
{"current_steps": 1355, "total_steps": 1432, "loss": 0.4374, "lr": 9.02166863034204e-08, "epoch": 1.8914205998604976, "percentage": 94.62, "elapsed_time": "3:03:42", "remaining_time": "0:10:26"}
|
1356 |
+
{"current_steps": 1356, "total_steps": 1432, "loss": 0.4398, "lr": 8.792502686258752e-08, "epoch": 1.8928156242734246, "percentage": 94.69, "elapsed_time": "3:03:50", "remaining_time": "0:10:18"}
|
1357 |
+
{"current_steps": 1357, "total_steps": 1432, "loss": 0.42, "lr": 8.566259095958207e-08, "epoch": 1.894210648686352, "percentage": 94.76, "elapsed_time": "3:03:57", "remaining_time": "0:10:10"}
|
1358 |
+
{"current_steps": 1358, "total_steps": 1432, "loss": 0.4899, "lr": 8.342939205437384e-08, "epoch": 1.8956056730992792, "percentage": 94.83, "elapsed_time": "3:04:05", "remaining_time": "0:10:01"}
|
1359 |
+
{"current_steps": 1359, "total_steps": 1432, "loss": 0.4246, "lr": 8.122544343299343e-08, "epoch": 1.8970006975122065, "percentage": 94.9, "elapsed_time": "3:04:11", "remaining_time": "0:09:53"}
|
1360 |
+
{"current_steps": 1360, "total_steps": 1432, "loss": 0.4156, "lr": 7.905075820744956e-08, "epoch": 1.8983957219251337, "percentage": 94.97, "elapsed_time": "3:04:18", "remaining_time": "0:09:45"}
|
1361 |
+
{"current_steps": 1361, "total_steps": 1432, "loss": 0.4056, "lr": 7.690534931565519e-08, "epoch": 1.899790746338061, "percentage": 95.04, "elapsed_time": "3:04:25", "remaining_time": "0:09:37"}
|
1362 |
+
{"current_steps": 1362, "total_steps": 1432, "loss": 0.4129, "lr": 7.478922952134815e-08, "epoch": 1.9011857707509883, "percentage": 95.11, "elapsed_time": "3:04:32", "remaining_time": "0:09:29"}
|
1363 |
+
{"current_steps": 1363, "total_steps": 1432, "loss": 0.5071, "lr": 7.270241141401568e-08, "epoch": 1.9025807951639153, "percentage": 95.18, "elapsed_time": "3:04:39", "remaining_time": "0:09:20"}
|
1364 |
+
{"current_steps": 1364, "total_steps": 1432, "loss": 0.4423, "lr": 7.064490740882057e-08, "epoch": 1.9039758195768426, "percentage": 95.25, "elapsed_time": "3:04:45", "remaining_time": "0:09:12"}
|
1365 |
+
{"current_steps": 1365, "total_steps": 1432, "loss": 0.4315, "lr": 6.861672974652622e-08, "epoch": 1.9053708439897699, "percentage": 95.32, "elapsed_time": "3:04:52", "remaining_time": "0:09:04"}
|
1366 |
+
{"current_steps": 1366, "total_steps": 1432, "loss": 0.4372, "lr": 6.661789049342282e-08, "epoch": 1.906765868402697, "percentage": 95.39, "elapsed_time": "3:04:59", "remaining_time": "0:08:56"}
|
1367 |
+
{"current_steps": 1367, "total_steps": 1432, "loss": 0.4441, "lr": 6.464840154125795e-08, "epoch": 1.9081608928156242, "percentage": 95.46, "elapsed_time": "3:05:06", "remaining_time": "0:08:48"}
|
1368 |
+
{"current_steps": 1368, "total_steps": 1432, "loss": 0.4599, "lr": 6.270827460716499e-08, "epoch": 1.9095559172285514, "percentage": 95.53, "elapsed_time": "3:05:14", "remaining_time": "0:08:39"}
|
1369 |
+
{"current_steps": 1369, "total_steps": 1432, "loss": 0.4065, "lr": 6.079752123359261e-08, "epoch": 1.9109509416414787, "percentage": 95.6, "elapsed_time": "3:05:20", "remaining_time": "0:08:31"}
|
1370 |
+
{"current_steps": 1370, "total_steps": 1432, "loss": 0.4273, "lr": 5.891615278823537e-08, "epoch": 1.912345966054406, "percentage": 95.67, "elapsed_time": "3:05:27", "remaining_time": "0:08:23"}
|
1371 |
+
{"current_steps": 1371, "total_steps": 1432, "loss": 0.4753, "lr": 5.7064180463969886e-08, "epoch": 1.9137409904673333, "percentage": 95.74, "elapsed_time": "3:05:36", "remaining_time": "0:08:15"}
|
1372 |
+
{"current_steps": 1372, "total_steps": 1432, "loss": 0.4113, "lr": 5.5241615278783245e-08, "epoch": 1.9151360148802605, "percentage": 95.81, "elapsed_time": "3:05:42", "remaining_time": "0:08:07"}
|
1373 |
+
{"current_steps": 1373, "total_steps": 1432, "loss": 0.4652, "lr": 5.34484680757108e-08, "epoch": 1.9165310392931876, "percentage": 95.88, "elapsed_time": "3:05:52", "remaining_time": "0:07:59"}
|
1374 |
+
{"current_steps": 1374, "total_steps": 1432, "loss": 0.476, "lr": 5.168474952277125e-08, "epoch": 1.9179260637061148, "percentage": 95.95, "elapsed_time": "3:05:59", "remaining_time": "0:07:51"}
|
1375 |
+
{"current_steps": 1375, "total_steps": 1432, "loss": 0.4438, "lr": 4.995047011290166e-08, "epoch": 1.9193210881190421, "percentage": 96.02, "elapsed_time": "3:06:07", "remaining_time": "0:07:42"}
|
1376 |
+
{"current_steps": 1376, "total_steps": 1432, "loss": 0.3857, "lr": 4.8245640163896433e-08, "epoch": 1.9207161125319692, "percentage": 96.09, "elapsed_time": "3:06:16", "remaining_time": "0:07:34"}
|
1377 |
+
{"current_steps": 1377, "total_steps": 1432, "loss": 0.4163, "lr": 4.657026981834623e-08, "epoch": 1.9221111369448964, "percentage": 96.16, "elapsed_time": "3:06:23", "remaining_time": "0:07:26"}
|
1378 |
+
{"current_steps": 1378, "total_steps": 1432, "loss": 0.438, "lr": 4.4924369043575776e-08, "epoch": 1.9235061613578237, "percentage": 96.23, "elapsed_time": "3:06:30", "remaining_time": "0:07:18"}
|
1379 |
+
{"current_steps": 1379, "total_steps": 1432, "loss": 0.4566, "lr": 4.330794763158619e-08, "epoch": 1.924901185770751, "percentage": 96.3, "elapsed_time": "3:06:40", "remaining_time": "0:07:10"}
|
1380 |
+
{"current_steps": 1380, "total_steps": 1432, "loss": 0.4004, "lr": 4.172101519899607e-08, "epoch": 1.9262962101836782, "percentage": 96.37, "elapsed_time": "3:06:47", "remaining_time": "0:07:02"}
|
1381 |
+
{"current_steps": 1381, "total_steps": 1432, "loss": 0.4773, "lr": 4.0163581186984935e-08, "epoch": 1.9276912345966055, "percentage": 96.44, "elapsed_time": "3:06:53", "remaining_time": "0:06:54"}
|
1382 |
+
{"current_steps": 1382, "total_steps": 1432, "loss": 0.4552, "lr": 3.8635654861235994e-08, "epoch": 1.9290862590095328, "percentage": 96.51, "elapsed_time": "3:07:03", "remaining_time": "0:06:46"}
|
1383 |
+
{"current_steps": 1383, "total_steps": 1432, "loss": 0.4947, "lr": 3.713724531188234e-08, "epoch": 1.93048128342246, "percentage": 96.58, "elapsed_time": "3:07:09", "remaining_time": "0:06:37"}
|
1384 |
+
{"current_steps": 1384, "total_steps": 1432, "loss": 0.4119, "lr": 3.566836145345032e-08, "epoch": 1.931876307835387, "percentage": 96.65, "elapsed_time": "3:07:18", "remaining_time": "0:06:29"}
|
1385 |
+
{"current_steps": 1385, "total_steps": 1432, "loss": 0.4251, "lr": 3.4229012024811215e-08, "epoch": 1.9332713322483144, "percentage": 96.72, "elapsed_time": "3:07:25", "remaining_time": "0:06:21"}
|
1386 |
+
{"current_steps": 1386, "total_steps": 1432, "loss": 0.4448, "lr": 3.28192055891241e-08, "epoch": 1.9346663566612414, "percentage": 96.79, "elapsed_time": "3:07:33", "remaining_time": "0:06:13"}
|
1387 |
+
{"current_steps": 1387, "total_steps": 1432, "loss": 0.4333, "lr": 3.143895053378698e-08, "epoch": 1.9360613810741687, "percentage": 96.86, "elapsed_time": "3:07:39", "remaining_time": "0:06:05"}
|
1388 |
+
{"current_steps": 1388, "total_steps": 1432, "loss": 0.4744, "lr": 3.0088255070389037e-08, "epoch": 1.937456405487096, "percentage": 96.93, "elapsed_time": "3:07:46", "remaining_time": "0:05:57"}
|
1389 |
+
{"current_steps": 1389, "total_steps": 1432, "loss": 0.4018, "lr": 2.876712723465791e-08, "epoch": 1.9388514299000232, "percentage": 97.0, "elapsed_time": "3:07:53", "remaining_time": "0:05:48"}
|
1390 |
+
{"current_steps": 1390, "total_steps": 1432, "loss": 0.4332, "lr": 2.7475574886414726e-08, "epoch": 1.9402464543129505, "percentage": 97.07, "elapsed_time": "3:08:00", "remaining_time": "0:05:40"}
|
1391 |
+
{"current_steps": 1391, "total_steps": 1432, "loss": 0.4138, "lr": 2.6213605709525803e-08, "epoch": 1.9416414787258778, "percentage": 97.14, "elapsed_time": "3:08:08", "remaining_time": "0:05:32"}
|
1392 |
+
{"current_steps": 1392, "total_steps": 1432, "loss": 0.3667, "lr": 2.498122721185825e-08, "epoch": 1.943036503138805, "percentage": 97.21, "elapsed_time": "3:08:15", "remaining_time": "0:05:24"}
|
1393 |
+
{"current_steps": 1393, "total_steps": 1432, "loss": 0.4528, "lr": 2.3778446725233328e-08, "epoch": 1.9444315275517323, "percentage": 97.28, "elapsed_time": "3:08:22", "remaining_time": "0:05:16"}
|
1394 |
+
{"current_steps": 1394, "total_steps": 1432, "loss": 0.3904, "lr": 2.2605271405385932e-08, "epoch": 1.9458265519646594, "percentage": 97.35, "elapsed_time": "3:08:29", "remaining_time": "0:05:08"}
|
1395 |
+
{"current_steps": 1395, "total_steps": 1432, "loss": 0.408, "lr": 2.1461708231919064e-08, "epoch": 1.9472215763775866, "percentage": 97.42, "elapsed_time": "3:08:38", "remaining_time": "0:05:00"}
|
1396 |
+
{"current_steps": 1396, "total_steps": 1432, "loss": 0.4298, "lr": 2.0347764008262216e-08, "epoch": 1.9486166007905137, "percentage": 97.49, "elapsed_time": "3:08:45", "remaining_time": "0:04:52"}
|
1397 |
+
{"current_steps": 1397, "total_steps": 1432, "loss": 0.5449, "lr": 1.926344536163416e-08, "epoch": 1.950011625203441, "percentage": 97.56, "elapsed_time": "3:08:51", "remaining_time": "0:04:43"}
|
1398 |
+
{"current_steps": 1398, "total_steps": 1432, "loss": 0.3951, "lr": 1.820875874300021e-08, "epoch": 1.9514066496163682, "percentage": 97.63, "elapsed_time": "3:08:59", "remaining_time": "0:04:35"}
|
1399 |
+
{"current_steps": 1399, "total_steps": 1432, "loss": 0.4529, "lr": 1.7183710427035595e-08, "epoch": 1.9528016740292955, "percentage": 97.7, "elapsed_time": "3:09:06", "remaining_time": "0:04:27"}
|
1400 |
+
{"current_steps": 1400, "total_steps": 1432, "loss": 0.4549, "lr": 1.6188306512087692e-08, "epoch": 1.9541966984422228, "percentage": 97.77, "elapsed_time": "3:09:17", "remaining_time": "0:04:19"}
|
1401 |
+
{"current_steps": 1401, "total_steps": 1432, "loss": 0.4751, "lr": 1.5222552920138855e-08, "epoch": 1.95559172285515, "percentage": 97.84, "elapsed_time": "3:09:24", "remaining_time": "0:04:11"}
|
1402 |
+
{"current_steps": 1402, "total_steps": 1432, "loss": 0.4438, "lr": 1.4286455396773092e-08, "epoch": 1.9569867472680773, "percentage": 97.91, "elapsed_time": "3:09:32", "remaining_time": "0:04:03"}
|
1403 |
+
{"current_steps": 1403, "total_steps": 1432, "loss": 0.444, "lr": 1.338001951113943e-08, "epoch": 1.9583817716810046, "percentage": 97.97, "elapsed_time": "3:09:40", "remaining_time": "0:03:55"}
|
1404 |
+
{"current_steps": 1404, "total_steps": 1432, "loss": 0.4264, "lr": 1.250325065592195e-08, "epoch": 1.9597767960939316, "percentage": 98.04, "elapsed_time": "3:09:47", "remaining_time": "0:03:47"}
|
1405 |
+
{"current_steps": 1405, "total_steps": 1432, "loss": 0.4593, "lr": 1.1656154047303691e-08, "epoch": 1.961171820506859, "percentage": 98.11, "elapsed_time": "3:09:55", "remaining_time": "0:03:38"}
|
1406 |
+
{"current_steps": 1406, "total_steps": 1432, "loss": 0.4464, "lr": 1.083873472494057e-08, "epoch": 1.962566844919786, "percentage": 98.18, "elapsed_time": "3:10:03", "remaining_time": "0:03:30"}
|
1407 |
+
{"current_steps": 1407, "total_steps": 1432, "loss": 0.45, "lr": 1.005099755192529e-08, "epoch": 1.9639618693327132, "percentage": 98.25, "elapsed_time": "3:10:11", "remaining_time": "0:03:22"}
|
1408 |
+
{"current_steps": 1408, "total_steps": 1432, "loss": 0.4871, "lr": 9.292947214764036e-09, "epoch": 1.9653568937456405, "percentage": 98.32, "elapsed_time": "3:10:23", "remaining_time": "0:03:14"}
|
1409 |
+
{"current_steps": 1409, "total_steps": 1432, "loss": 0.4249, "lr": 8.564588223346493e-09, "epoch": 1.9667519181585678, "percentage": 98.39, "elapsed_time": "3:10:30", "remaining_time": "0:03:06"}
|
1410 |
+
{"current_steps": 1410, "total_steps": 1432, "loss": 0.4233, "lr": 7.865924910916977e-09, "epoch": 1.968146942571495, "percentage": 98.46, "elapsed_time": "3:10:36", "remaining_time": "0:02:58"}
|
1411 |
+
{"current_steps": 1411, "total_steps": 1432, "loss": 0.4357, "lr": 7.196961434052796e-09, "epoch": 1.9695419669844223, "percentage": 98.53, "elapsed_time": "3:10:45", "remaining_time": "0:02:50"}
|
1412 |
+
{"current_steps": 1412, "total_steps": 1432, "loss": 0.4814, "lr": 6.557701772635372e-09, "epoch": 1.9709369913973496, "percentage": 98.6, "elapsed_time": "3:10:51", "remaining_time": "0:02:42"}
|
1413 |
+
{"current_steps": 1413, "total_steps": 1432, "loss": 0.4307, "lr": 5.9481497298291556e-09, "epoch": 1.9723320158102768, "percentage": 98.67, "elapsed_time": "3:10:58", "remaining_time": "0:02:34"}
|
1414 |
+
{"current_steps": 1414, "total_steps": 1432, "loss": 0.3866, "lr": 5.368308932058863e-09, "epoch": 1.9737270402232039, "percentage": 98.74, "elapsed_time": "3:11:05", "remaining_time": "0:02:25"}
|
1415 |
+
{"current_steps": 1415, "total_steps": 1432, "loss": 0.4183, "lr": 4.818182828985607e-09, "epoch": 1.9751220646361312, "percentage": 98.81, "elapsed_time": "3:11:11", "remaining_time": "0:02:17"}
|
1416 |
+
{"current_steps": 1416, "total_steps": 1432, "loss": 0.4314, "lr": 4.2977746934907975e-09, "epoch": 1.9765170890490582, "percentage": 98.88, "elapsed_time": "3:11:18", "remaining_time": "0:02:09"}
|
1417 |
+
{"current_steps": 1417, "total_steps": 1432, "loss": 0.4657, "lr": 3.807087621650607e-09, "epoch": 1.9779121134619855, "percentage": 98.95, "elapsed_time": "3:11:30", "remaining_time": "0:02:01"}
|
1418 |
+
{"current_steps": 1418, "total_steps": 1432, "loss": 0.4398, "lr": 3.3461245327237603e-09, "epoch": 1.9793071378749127, "percentage": 99.02, "elapsed_time": "3:11:42", "remaining_time": "0:01:53"}
|
1419 |
+
{"current_steps": 1419, "total_steps": 1432, "loss": 0.4006, "lr": 2.9148881691298812e-09, "epoch": 1.98070216228784, "percentage": 99.09, "elapsed_time": "3:11:56", "remaining_time": "0:01:45"}
|
1420 |
+
{"current_steps": 1420, "total_steps": 1432, "loss": 0.4378, "lr": 2.5133810964350635e-09, "epoch": 1.9820971867007673, "percentage": 99.16, "elapsed_time": "3:12:06", "remaining_time": "0:01:37"}
|
1421 |
+
{"current_steps": 1421, "total_steps": 1432, "loss": 0.4599, "lr": 2.1416057033352144e-09, "epoch": 1.9834922111136946, "percentage": 99.23, "elapsed_time": "3:12:16", "remaining_time": "0:01:29"}
|
1422 |
+
{"current_steps": 1422, "total_steps": 1432, "loss": 0.4657, "lr": 1.7995642016449544e-09, "epoch": 1.9848872355266218, "percentage": 99.3, "elapsed_time": "3:12:23", "remaining_time": "0:01:21"}
|
1423 |
+
{"current_steps": 1423, "total_steps": 1432, "loss": 0.4324, "lr": 1.4872586262792975e-09, "epoch": 1.986282259939549, "percentage": 99.37, "elapsed_time": "3:12:29", "remaining_time": "0:01:13"}
|
1424 |
+
{"current_steps": 1424, "total_steps": 1432, "loss": 0.4817, "lr": 1.2046908352475462e-09, "epoch": 1.9876772843524761, "percentage": 99.44, "elapsed_time": "3:12:36", "remaining_time": "0:01:04"}
|
1425 |
+
{"current_steps": 1425, "total_steps": 1432, "loss": 0.4473, "lr": 9.518625096366364e-10, "epoch": 1.9890723087654034, "percentage": 99.51, "elapsed_time": "3:12:42", "remaining_time": "0:00:56"}
|
1426 |
+
{"current_steps": 1426, "total_steps": 1432, "loss": 0.411, "lr": 7.287751536050324e-10, "epoch": 1.9904673331783305, "percentage": 99.58, "elapsed_time": "3:12:49", "remaining_time": "0:00:48"}
|
1427 |
+
{"current_steps": 1427, "total_steps": 1432, "loss": 0.4586, "lr": 5.354300943727353e-10, "epoch": 1.9918623575912577, "percentage": 99.65, "elapsed_time": "3:12:56", "remaining_time": "0:00:40"}
|
1428 |
+
{"current_steps": 1428, "total_steps": 1432, "loss": 0.4408, "lr": 3.718284822118445e-10, "epoch": 1.993257382004185, "percentage": 99.72, "elapsed_time": "3:13:03", "remaining_time": "0:00:32"}
|
1429 |
+
{"current_steps": 1429, "total_steps": 1432, "loss": 0.3978, "lr": 2.379712904426734e-10, "epoch": 1.9946524064171123, "percentage": 99.79, "elapsed_time": "3:13:11", "remaining_time": "0:00:24"}
|
1430 |
+
{"current_steps": 1430, "total_steps": 1432, "loss": 0.4362, "lr": 1.3385931542486686e-10, "epoch": 1.9960474308300395, "percentage": 99.86, "elapsed_time": "3:13:20", "remaining_time": "0:00:16"}
|
1431 |
+
{"current_steps": 1431, "total_steps": 1432, "loss": 0.4613, "lr": 5.949317655462583e-11, "epoch": 1.9974424552429668, "percentage": 99.93, "elapsed_time": "3:13:29", "remaining_time": "0:00:08"}
|
1432 |
+
{"current_steps": 1432, "total_steps": 1432, "loss": 0.4646, "lr": 1.4873316260266558e-11, "epoch": 1.998837479655894, "percentage": 100.0, "elapsed_time": "3:13:39", "remaining_time": "0:00:00"}
|
1433 |
+
{"current_steps": 1432, "total_steps": 1432, "epoch": 1.998837479655894, "percentage": 100.0, "elapsed_time": "3:15:26", "remaining_time": "0:00:00"}
|