Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:deb310f3b83115834b77de27499bca5834c24906a9bfb77965373a5efa4f9a48
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ce9fd9ec93b9724307779484a565c9ec0389ee1c4eaa037bf80fc9be9432a0a
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e62577d2230e25561169b8b06fcab4dfeacb9c16f91156cc8e3528a72f650159
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc557beaeb050bbf5f550c395b3b81e3e70346ffa1c1081cfea81d7ab50e788b
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -220,3 +220,115 @@
|
|
220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4106, "lr": 5.006611372971982e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:13:25", "remaining_time": "10:54:04"}
|
221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.3995, "lr": 4.928827983136444e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:18:56", "remaining_time": "10:48:09"}
|
222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4229, "lr": 4.8513836384346175e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:24:56", "remaining_time": "10:42:28"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4106, "lr": 5.006611372971982e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:13:25", "remaining_time": "10:54:04"}
|
221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.3995, "lr": 4.928827983136444e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:18:56", "remaining_time": "10:48:09"}
|
222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4229, "lr": 4.8513836384346175e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:24:56", "remaining_time": "10:42:28"}
|
223 |
+
{"current_steps": 223, "total_steps": 333, "loss": 0.72, "lr": 4.774286888413083e-05, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "21:31:25", "remaining_time": "10:37:01"}
|
224 |
+
{"current_steps": 224, "total_steps": 333, "loss": 0.3579, "lr": 4.697546244245351e-05, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "21:37:07", "remaining_time": "10:31:11"}
|
225 |
+
{"current_steps": 225, "total_steps": 333, "loss": 0.3791, "lr": 4.6211701777922695e-05, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "21:43:11", "remaining_time": "10:25:32"}
|
226 |
+
{"current_steps": 226, "total_steps": 333, "loss": 0.3665, "lr": 4.545167120666758e-05, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "21:48:59", "remaining_time": "10:19:44"}
|
227 |
+
{"current_steps": 227, "total_steps": 333, "loss": 0.3715, "lr": 4.469545463303e-05, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "21:55:00", "remaining_time": "10:14:03"}
|
228 |
+
{"current_steps": 228, "total_steps": 333, "loss": 0.3641, "lr": 4.394313554030163e-05, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "22:00:51", "remaining_time": "10:08:17"}
|
229 |
+
{"current_steps": 229, "total_steps": 333, "loss": 0.3781, "lr": 4.3194796981507835e-05, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "22:06:33", "remaining_time": "10:02:27"}
|
230 |
+
{"current_steps": 230, "total_steps": 333, "loss": 0.3645, "lr": 4.245052157023891e-05, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "22:12:21", "remaining_time": "9:56:40"}
|
231 |
+
{"current_steps": 231, "total_steps": 333, "loss": 0.3654, "lr": 4.1710391471529894e-05, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "22:18:24", "remaining_time": "9:50:59"}
|
232 |
+
{"current_steps": 232, "total_steps": 333, "loss": 0.3681, "lr": 4.0974488392789824e-05, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "22:24:13", "remaining_time": "9:45:11"}
|
233 |
+
{"current_steps": 233, "total_steps": 333, "loss": 0.3544, "lr": 4.0242893574781645e-05, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "22:30:07", "remaining_time": "9:39:27"}
|
234 |
+
{"current_steps": 234, "total_steps": 333, "loss": 0.3685, "lr": 3.951568778265347e-05, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "22:35:38", "remaining_time": "9:33:32"}
|
235 |
+
{"current_steps": 235, "total_steps": 333, "loss": 0.367, "lr": 3.879295129702254e-05, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "22:41:31", "remaining_time": "9:27:47"}
|
236 |
+
{"current_steps": 236, "total_steps": 333, "loss": 0.3627, "lr": 3.807476390511243e-05, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "22:47:21", "remaining_time": "9:22:00"}
|
237 |
+
{"current_steps": 237, "total_steps": 333, "loss": 0.371, "lr": 3.7361204891944926e-05, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "22:53:15", "remaining_time": "9:16:15"}
|
238 |
+
{"current_steps": 238, "total_steps": 333, "loss": 0.3604, "lr": 3.66523530315873e-05, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "22:59:01", "remaining_time": "9:10:26"}
|
239 |
+
{"current_steps": 239, "total_steps": 333, "loss": 0.3624, "lr": 3.594828657845594e-05, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "23:04:45", "remaining_time": "9:04:37"}
|
240 |
+
{"current_steps": 240, "total_steps": 333, "loss": 0.3639, "lr": 3.524908325867735e-05, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "23:10:22", "remaining_time": "8:58:46"}
|
241 |
+
{"current_steps": 241, "total_steps": 333, "loss": 0.3544, "lr": 3.455482026150755e-05, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "23:16:14", "remaining_time": "8:53:00"}
|
242 |
+
{"current_steps": 242, "total_steps": 333, "loss": 0.3773, "lr": 3.3865574230810636e-05, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "23:22:02", "remaining_time": "8:47:12"}
|
243 |
+
{"current_steps": 243, "total_steps": 333, "loss": 0.3825, "lr": 3.318142125659765e-05, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "23:27:43", "remaining_time": "8:41:22"}
|
244 |
+
{"current_steps": 244, "total_steps": 333, "loss": 0.3579, "lr": 3.250243686662651e-05, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "23:33:08", "remaining_time": "8:35:26"}
|
245 |
+
{"current_steps": 245, "total_steps": 333, "loss": 0.3626, "lr": 3.182869601806406e-05, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "23:38:48", "remaining_time": "8:29:36"}
|
246 |
+
{"current_steps": 246, "total_steps": 333, "loss": 0.3573, "lr": 3.11602730892111e-05, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "23:44:29", "remaining_time": "8:23:46"}
|
247 |
+
{"current_steps": 247, "total_steps": 333, "loss": 0.3667, "lr": 3.0497241871291333e-05, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "23:50:13", "remaining_time": "8:17:58"}
|
248 |
+
{"current_steps": 248, "total_steps": 333, "loss": 0.3539, "lr": 2.9839675560305088e-05, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "23:55:48", "remaining_time": "8:12:06"}
|
249 |
+
{"current_steps": 249, "total_steps": 333, "loss": 0.3618, "lr": 2.918764674894875e-05, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "1 day, 0:01:34", "remaining_time": "8:06:18"}
|
250 |
+
{"current_steps": 250, "total_steps": 333, "loss": 0.3624, "lr": 2.8541227418600858e-05, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "1 day, 0:07:15", "remaining_time": "8:00:29"}
|
251 |
+
{"current_steps": 251, "total_steps": 333, "loss": 0.3664, "lr": 2.7900488931375666e-05, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "1 day, 0:13:13", "remaining_time": "7:54:45"}
|
252 |
+
{"current_steps": 252, "total_steps": 333, "loss": 0.372, "lr": 2.7265502022244993e-05, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "1 day, 0:19:15", "remaining_time": "7:49:02"}
|
253 |
+
{"current_steps": 253, "total_steps": 333, "loss": 0.3601, "lr": 2.6636336791229393e-05, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "1 day, 0:24:49", "remaining_time": "7:43:11"}
|
254 |
+
{"current_steps": 254, "total_steps": 333, "loss": 0.3779, "lr": 2.6013062695659397e-05, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "1 day, 0:30:42", "remaining_time": "7:37:25"}
|
255 |
+
{"current_steps": 255, "total_steps": 333, "loss": 0.3628, "lr": 2.539574854250769e-05, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "1 day, 0:36:41", "remaining_time": "7:31:41"}
|
256 |
+
{"current_steps": 256, "total_steps": 333, "loss": 0.3706, "lr": 2.4784462480793084e-05, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "1 day, 0:42:17", "remaining_time": "7:25:50"}
|
257 |
+
{"current_steps": 257, "total_steps": 333, "loss": 0.3702, "lr": 2.4179271994057184e-05, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "1 day, 0:48:10", "remaining_time": "7:20:04"}
|
258 |
+
{"current_steps": 258, "total_steps": 333, "loss": 0.3573, "lr": 2.3580243892914424e-05, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "1 day, 0:54:03", "remaining_time": "7:14:19"}
|
259 |
+
{"current_steps": 259, "total_steps": 333, "loss": 0.3758, "lr": 2.2987444307676478e-05, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "1 day, 0:59:54", "remaining_time": "7:08:32"}
|
260 |
+
{"current_steps": 260, "total_steps": 333, "loss": 0.3511, "lr": 2.24009386810517e-05, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "1 day, 1:05:27", "remaining_time": "7:02:41"}
|
261 |
+
{"current_steps": 261, "total_steps": 333, "loss": 0.3716, "lr": 2.1820791760920547e-05, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "1 day, 1:11:01", "remaining_time": "6:56:50"}
|
262 |
+
{"current_steps": 262, "total_steps": 333, "loss": 0.3683, "lr": 2.124706759318766e-05, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "1 day, 1:16:40", "remaining_time": "6:51:00"}
|
263 |
+
{"current_steps": 263, "total_steps": 333, "loss": 0.3646, "lr": 2.0679829514711436e-05, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 1:22:35", "remaining_time": "6:45:15"}
|
264 |
+
{"current_steps": 264, "total_steps": 333, "loss": 0.3686, "lr": 2.0119140146311905e-05, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 1:28:17", "remaining_time": "6:39:26"}
|
265 |
+
{"current_steps": 265, "total_steps": 333, "loss": 0.3682, "lr": 1.9565061385857663e-05, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 1:34:11", "remaining_time": "6:33:40"}
|
266 |
+
{"current_steps": 266, "total_steps": 333, "loss": 0.3717, "lr": 1.9017654401432546e-05, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 1:40:01", "remaining_time": "6:27:54"}
|
267 |
+
{"current_steps": 267, "total_steps": 333, "loss": 0.3581, "lr": 1.8476979624582937e-05, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 1:45:51", "remaining_time": "6:22:07"}
|
268 |
+
{"current_steps": 268, "total_steps": 333, "loss": 0.37, "lr": 1.794309674364641e-05, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 1:51:51", "remaining_time": "6:16:22"}
|
269 |
+
{"current_steps": 269, "total_steps": 333, "loss": 0.3736, "lr": 1.7416064697162287e-05, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 1:57:35", "remaining_time": "6:10:34"}
|
270 |
+
{"current_steps": 270, "total_steps": 333, "loss": 0.3535, "lr": 1.6895941667365168e-05, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 2:03:18", "remaining_time": "6:04:46"}
|
271 |
+
{"current_steps": 271, "total_steps": 333, "loss": 0.3571, "lr": 1.6382785073761703e-05, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 2:09:20", "remaining_time": "5:59:02"}
|
272 |
+
{"current_steps": 272, "total_steps": 333, "loss": 0.3658, "lr": 1.587665156679185e-05, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 2:15:19", "remaining_time": "5:53:17"}
|
273 |
+
{"current_steps": 273, "total_steps": 333, "loss": 0.358, "lr": 1.537759702157482e-05, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 2:20:54", "remaining_time": "5:47:27"}
|
274 |
+
{"current_steps": 274, "total_steps": 333, "loss": 0.3758, "lr": 1.4885676531740694e-05, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 2:26:40", "remaining_time": "5:41:39"}
|
275 |
+
{"current_steps": 275, "total_steps": 333, "loss": 0.366, "lr": 1.4400944403348321e-05, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 2:32:18", "remaining_time": "5:35:49"}
|
276 |
+
{"current_steps": 276, "total_steps": 333, "loss": 0.3702, "lr": 1.392345414889011e-05, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 2:38:21", "remaining_time": "5:30:05"}
|
277 |
+
{"current_steps": 277, "total_steps": 333, "loss": 0.3511, "lr": 1.345325848138451e-05, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 2:44:09", "remaining_time": "5:24:18"}
|
278 |
+
{"current_steps": 278, "total_steps": 333, "loss": 0.3516, "lr": 1.2990409308556679e-05, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 2:49:38", "remaining_time": "5:18:27"}
|
279 |
+
{"current_steps": 279, "total_steps": 333, "loss": 0.3633, "lr": 1.2534957727108083e-05, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 2:55:12", "remaining_time": "5:12:37"}
|
280 |
+
{"current_steps": 280, "total_steps": 333, "loss": 0.3733, "lr": 1.208695401707562e-05, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 3:00:58", "remaining_time": "5:06:49"}
|
281 |
+
{"current_steps": 281, "total_steps": 333, "loss": 0.3555, "lr": 1.1646447636280916e-05, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 3:06:41", "remaining_time": "5:01:01"}
|
282 |
+
{"current_steps": 282, "total_steps": 333, "loss": 0.359, "lr": 1.1213487214870366e-05, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 3:12:32", "remaining_time": "4:55:14"}
|
283 |
+
{"current_steps": 283, "total_steps": 333, "loss": 0.3744, "lr": 1.0788120549946535e-05, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 3:18:14", "remaining_time": "4:49:26"}
|
284 |
+
{"current_steps": 284, "total_steps": 333, "loss": 0.3508, "lr": 1.0370394600291633e-05, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 3:23:51", "remaining_time": "4:43:37"}
|
285 |
+
{"current_steps": 285, "total_steps": 333, "loss": 0.3789, "lr": 9.960355481183357e-06, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 3:29:31", "remaining_time": "4:37:48"}
|
286 |
+
{"current_steps": 286, "total_steps": 333, "loss": 0.3667, "lr": 9.55804845930401e-06, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 3:35:14", "remaining_time": "4:32:00"}
|
287 |
+
{"current_steps": 287, "total_steps": 333, "loss": 0.368, "lr": 9.163517947743218e-06, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 3:40:53", "remaining_time": "4:26:12"}
|
288 |
+
{"current_steps": 288, "total_steps": 333, "loss": 0.3568, "lr": 8.776807501094891e-06, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 3:46:42", "remaining_time": "4:20:25"}
|
289 |
+
{"current_steps": 289, "total_steps": 333, "loss": 0.3564, "lr": 8.397959810648992e-06, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 3:52:24", "remaining_time": "4:14:37"}
|
290 |
+
{"current_steps": 290, "total_steps": 333, "loss": 0.3726, "lr": 8.027016699678581e-06, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 3:58:24", "remaining_time": "4:08:52"}
|
291 |
+
{"current_steps": 291, "total_steps": 333, "loss": 0.367, "lr": 7.664019118822676e-06, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 4:04:04", "remaining_time": "4:03:03"}
|
292 |
+
{"current_steps": 292, "total_steps": 333, "loss": 0.3525, "lr": 7.30900714156551e-06, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 4:10:05", "remaining_time": "3:57:18"}
|
293 |
+
{"current_steps": 293, "total_steps": 333, "loss": 0.3699, "lr": 6.962019959812516e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 4:15:58", "remaining_time": "3:51:31"}
|
294 |
+
{"current_steps": 294, "total_steps": 333, "loss": 0.3665, "lr": 6.623095879563774e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 4:21:40", "remaining_time": "3:45:43"}
|
295 |
+
{"current_steps": 295, "total_steps": 333, "loss": 0.3583, "lr": 6.29227231668506e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 4:27:30", "remaining_time": "3:39:56"}
|
296 |
+
{"current_steps": 296, "total_steps": 333, "loss": 0.3679, "lr": 5.9695857927774396e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 4:33:21", "remaining_time": "3:34:10"}
|
297 |
+
{"current_steps": 297, "total_steps": 333, "loss": 0.3653, "lr": 5.655071931145317e-06, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 4:39:12", "remaining_time": "3:28:23"}
|
298 |
+
{"current_steps": 298, "total_steps": 333, "loss": 0.3646, "lr": 5.3487654528638025e-06, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 4:45:07", "remaining_time": "3:22:36"}
|
299 |
+
{"current_steps": 299, "total_steps": 333, "loss": 0.3577, "lr": 5.050700172945631e-06, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 4:50:58", "remaining_time": "3:16:50"}
|
300 |
+
{"current_steps": 300, "total_steps": 333, "loss": 0.3564, "lr": 4.760908996608145e-06, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 4:56:46", "remaining_time": "3:11:02"}
|
301 |
+
{"current_steps": 301, "total_steps": 333, "loss": 0.3654, "lr": 4.47942391564066e-06, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 5:02:33", "remaining_time": "3:05:15"}
|
302 |
+
{"current_steps": 302, "total_steps": 333, "loss": 0.372, "lr": 4.206276004872729e-06, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 5:08:33", "remaining_time": "2:59:29"}
|
303 |
+
{"current_steps": 303, "total_steps": 333, "loss": 0.3588, "lr": 3.941495418743557e-06, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 5:14:19", "remaining_time": "2:53:41"}
|
304 |
+
{"current_steps": 304, "total_steps": 333, "loss": 0.3545, "lr": 3.685111387973139e-06, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 5:19:56", "remaining_time": "2:47:53"}
|
305 |
+
{"current_steps": 305, "total_steps": 333, "loss": 0.3634, "lr": 3.4371522163352444e-06, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 5:25:18", "remaining_time": "2:42:03"}
|
306 |
+
{"current_steps": 306, "total_steps": 333, "loss": 0.3557, "lr": 3.1976452775328302e-06, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 5:31:10", "remaining_time": "2:36:16"}
|
307 |
+
{"current_steps": 307, "total_steps": 333, "loss": 0.3652, "lr": 2.9666170121760698e-06, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 5:36:50", "remaining_time": "2:30:28"}
|
308 |
+
{"current_steps": 308, "total_steps": 333, "loss": 0.3493, "lr": 2.7440929248634216e-06, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 5:42:28", "remaining_time": "2:24:40"}
|
309 |
+
{"current_steps": 309, "total_steps": 333, "loss": 0.3799, "lr": 2.5300975813660467e-06, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 5:48:24", "remaining_time": "2:18:54"}
|
310 |
+
{"current_steps": 310, "total_steps": 333, "loss": 0.3485, "lr": 2.324654605915839e-06, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 5:53:51", "remaining_time": "2:13:05"}
|
311 |
+
{"current_steps": 311, "total_steps": 333, "loss": 0.3685, "lr": 2.127786678597348e-06, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 5:59:34", "remaining_time": "2:07:18"}
|
312 |
+
{"current_steps": 312, "total_steps": 333, "loss": 0.3665, "lr": 1.9395155328440605e-06, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 6:05:13", "remaining_time": "2:01:30"}
|
313 |
+
{"current_steps": 313, "total_steps": 333, "loss": 0.3597, "lr": 1.7598619530390904e-06, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 6:11:16", "remaining_time": "1:55:44"}
|
314 |
+
{"current_steps": 314, "total_steps": 333, "loss": 0.3651, "lr": 1.5888457722206529e-06, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 6:17:16", "remaining_time": "1:49:57"}
|
315 |
+
{"current_steps": 315, "total_steps": 333, "loss": 0.3596, "lr": 1.4264858698926022e-06, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 6:23:02", "remaining_time": "1:44:10"}
|
316 |
+
{"current_steps": 316, "total_steps": 333, "loss": 0.3632, "lr": 1.2728001699401583e-06, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 6:29:00", "remaining_time": "1:38:23"}
|
317 |
+
{"current_steps": 317, "total_steps": 333, "loss": 0.3698, "lr": 1.1278056386512514e-06, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 6:34:48", "remaining_time": "1:32:36"}
|
318 |
+
{"current_steps": 318, "total_steps": 333, "loss": 0.3634, "lr": 9.915182828434688e-07, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 6:40:45", "remaining_time": "1:26:49"}
|
319 |
+
{"current_steps": 319, "total_steps": 333, "loss": 0.3589, "lr": 8.639531480969787e-07, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 6:46:28", "remaining_time": "1:21:02"}
|
320 |
+
{"current_steps": 320, "total_steps": 333, "loss": 0.3684, "lr": 7.451243170935396e-07, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 6:52:29", "remaining_time": "1:15:15"}
|
321 |
+
{"current_steps": 321, "total_steps": 333, "loss": 0.3617, "lr": 6.350449080618593e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 6:58:32", "remaining_time": "1:09:28"}
|
322 |
+
{"current_steps": 322, "total_steps": 333, "loss": 0.3613, "lr": 5.337270733293665e-07, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 7:04:11", "remaining_time": "1:03:41"}
|
323 |
+
{"current_steps": 323, "total_steps": 333, "loss": 0.3654, "lr": 4.4118199798066195e-07, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 7:09:54", "remaining_time": "0:57:53"}
|
324 |
+
{"current_steps": 324, "total_steps": 333, "loss": 0.3592, "lr": 3.5741989862271955e-07, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 7:15:41", "remaining_time": "0:52:06"}
|
325 |
+
{"current_steps": 325, "total_steps": 333, "loss": 0.3694, "lr": 2.824500222570148e-07, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 7:21:21", "remaining_time": "0:46:18"}
|
326 |
+
{"current_steps": 326, "total_steps": 333, "loss": 0.3545, "lr": 2.162806452587063e-07, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 7:27:13", "remaining_time": "0:40:31"}
|
327 |
+
{"current_steps": 327, "total_steps": 333, "loss": 0.3521, "lr": 1.5891907246292192e-07, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 7:33:07", "remaining_time": "0:34:44"}
|
328 |
+
{"current_steps": 328, "total_steps": 333, "loss": 0.3645, "lr": 1.103716363583729e-07, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 7:38:56", "remaining_time": "0:28:56"}
|
329 |
+
{"current_steps": 329, "total_steps": 333, "loss": 0.36, "lr": 7.064369638825064e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 7:44:48", "remaining_time": "0:23:09"}
|
330 |
+
{"current_steps": 330, "total_steps": 333, "loss": 0.363, "lr": 3.973963835858463e-08, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 7:50:23", "remaining_time": "0:17:22"}
|
331 |
+
{"current_steps": 331, "total_steps": 333, "loss": 0.3659, "lr": 1.766287395404298e-08, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 7:56:32", "remaining_time": "0:11:34"}
|
332 |
+
{"current_steps": 332, "total_steps": 333, "loss": 0.3593, "lr": 4.415840361300383e-09, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 8:02:20", "remaining_time": "0:05:47"}
|
333 |
+
{"current_steps": 333, "total_steps": 333, "loss": 0.3626, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:08:14", "remaining_time": "0:00:00"}
|
334 |
+
{"current_steps": 333, "total_steps": 333, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:09:48", "remaining_time": "0:00:00"}
|