Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91c6d95bae0d66d5b019c517000937831972dd99b104c05d6807889bc13603d8
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8a3b9a4e5a2317467c8aa9dc80ef6acdb2610cad7c09a3a839c05563f2285ea
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:659714acac33b060a1a9b4d6e9123dec6a80e0563fb278dea34fc66295a563d6
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0699445c52be2a6779d8297c4f375b44d7696a6ae7015b6245d8d0b28637db86
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -220,3 +220,115 @@
|
|
220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4141, "lr": 7.080412386299138e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:10:10", "remaining_time": "10:52:24"}
|
221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.4029, "lr": 6.970410144101348e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:15:40", "remaining_time": "10:46:29"}
|
222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4266, "lr": 6.860887383769717e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:21:40", "remaining_time": "10:40:50"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4141, "lr": 7.080412386299138e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:10:10", "remaining_time": "10:52:24"}
|
221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.4029, "lr": 6.970410144101348e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:15:40", "remaining_time": "10:46:29"}
|
222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4266, "lr": 6.860887383769717e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:21:40", "remaining_time": "10:40:50"}
|
223 |
+
{"current_steps": 223, "total_steps": 333, "loss": 0.7214, "lr": 6.751856196179887e-05, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "21:28:07", "remaining_time": "10:35:24"}
|
224 |
+
{"current_steps": 224, "total_steps": 333, "loss": 0.3541, "lr": 6.643328617939827e-05, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "21:33:49", "remaining_time": "10:29:35"}
|
225 |
+
{"current_steps": 225, "total_steps": 333, "loss": 0.3741, "lr": 6.53531663006105e-05, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "21:39:52", "remaining_time": "10:23:56"}
|
226 |
+
{"current_steps": 226, "total_steps": 333, "loss": 0.3623, "lr": 6.427832156635937e-05, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "21:45:39", "remaining_time": "10:18:10"}
|
227 |
+
{"current_steps": 227, "total_steps": 333, "loss": 0.3666, "lr": 6.320887063521393e-05, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "21:51:39", "remaining_time": "10:12:29"}
|
228 |
+
{"current_steps": 228, "total_steps": 333, "loss": 0.3588, "lr": 6.214493157028881e-05, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "21:57:29", "remaining_time": "10:06:44"}
|
229 |
+
{"current_steps": 229, "total_steps": 333, "loss": 0.3734, "lr": 6.108662182621064e-05, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "22:03:11", "remaining_time": "10:00:55"}
|
230 |
+
{"current_steps": 230, "total_steps": 333, "loss": 0.3595, "lr": 6.003405823615149e-05, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "22:08:57", "remaining_time": "9:55:08"}
|
231 |
+
{"current_steps": 231, "total_steps": 333, "loss": 0.3605, "lr": 5.898735699893096e-05, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "22:14:58", "remaining_time": "9:49:28"}
|
232 |
+
{"current_steps": 232, "total_steps": 333, "loss": 0.3632, "lr": 5.794663366618828e-05, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "22:20:45", "remaining_time": "9:43:41"}
|
233 |
+
{"current_steps": 233, "total_steps": 333, "loss": 0.3498, "lr": 5.691200312962588e-05, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "22:26:39", "remaining_time": "9:37:57"}
|
234 |
+
{"current_steps": 234, "total_steps": 333, "loss": 0.3629, "lr": 5.5883579608325826e-05, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "22:32:08", "remaining_time": "9:32:03"}
|
235 |
+
{"current_steps": 235, "total_steps": 333, "loss": 0.3616, "lr": 5.486147663614048e-05, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "22:37:59", "remaining_time": "9:26:18"}
|
236 |
+
{"current_steps": 236, "total_steps": 333, "loss": 0.3568, "lr": 5.3845807049158815e-05, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "22:43:48", "remaining_time": "9:20:33"}
|
237 |
+
{"current_steps": 237, "total_steps": 333, "loss": 0.3655, "lr": 5.2836682973249665e-05, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "22:49:43", "remaining_time": "9:14:49"}
|
238 |
+
{"current_steps": 238, "total_steps": 333, "loss": 0.3549, "lr": 5.1834215811683654e-05, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "22:55:27", "remaining_time": "9:09:01"}
|
239 |
+
{"current_steps": 239, "total_steps": 333, "loss": 0.3566, "lr": 5.0838516232834614e-05, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "23:01:10", "remaining_time": "9:03:13"}
|
240 |
+
{"current_steps": 240, "total_steps": 333, "loss": 0.3588, "lr": 4.9849694157962234e-05, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "23:06:47", "remaining_time": "8:57:22"}
|
241 |
+
{"current_steps": 241, "total_steps": 333, "loss": 0.3488, "lr": 4.886785874907724e-05, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "23:12:37", "remaining_time": "8:51:37"}
|
242 |
+
{"current_steps": 242, "total_steps": 333, "loss": 0.3715, "lr": 4.7893118396890284e-05, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "23:18:26", "remaining_time": "8:45:51"}
|
243 |
+
{"current_steps": 243, "total_steps": 333, "loss": 0.3765, "lr": 4.6925580708846104e-05, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "23:24:06", "remaining_time": "8:40:02"}
|
244 |
+
{"current_steps": 244, "total_steps": 333, "loss": 0.3519, "lr": 4.596535249724404e-05, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "23:29:31", "remaining_time": "8:34:07"}
|
245 |
+
{"current_steps": 245, "total_steps": 333, "loss": 0.3561, "lr": 4.501253976744641e-05, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "23:35:11", "remaining_time": "8:28:18"}
|
246 |
+
{"current_steps": 246, "total_steps": 333, "loss": 0.3515, "lr": 4.406724770617595e-05, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "23:40:51", "remaining_time": "8:22:29"}
|
247 |
+
{"current_steps": 247, "total_steps": 333, "loss": 0.3612, "lr": 4.3129580669903586e-05, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "23:46:34", "remaining_time": "8:16:42"}
|
248 |
+
{"current_steps": 248, "total_steps": 333, "loss": 0.3482, "lr": 4.2199642173327955e-05, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "23:52:08", "remaining_time": "8:10:51"}
|
249 |
+
{"current_steps": 249, "total_steps": 333, "loss": 0.3559, "lr": 4.127753487794768e-05, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "23:57:52", "remaining_time": "8:05:03"}
|
250 |
+
{"current_steps": 250, "total_steps": 333, "loss": 0.356, "lr": 4.036336058072806e-05, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "1 day, 0:03:32", "remaining_time": "7:59:15"}
|
251 |
+
{"current_steps": 251, "total_steps": 333, "loss": 0.3606, "lr": 3.9457220202863104e-05, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "1 day, 0:09:29", "remaining_time": "7:53:32"}
|
252 |
+
{"current_steps": 252, "total_steps": 333, "loss": 0.3667, "lr": 3.855921377863414e-05, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "1 day, 0:15:31", "remaining_time": "7:47:50"}
|
253 |
+
{"current_steps": 253, "total_steps": 333, "loss": 0.3548, "lr": 3.766944044436649e-05, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "1 day, 0:21:04", "remaining_time": "7:42:00"}
|
254 |
+
{"current_steps": 254, "total_steps": 333, "loss": 0.3716, "lr": 3.678799842748521e-05, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "1 day, 0:26:58", "remaining_time": "7:36:15"}
|
255 |
+
{"current_steps": 255, "total_steps": 333, "loss": 0.3571, "lr": 3.5914985035671156e-05, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "1 day, 0:32:55", "remaining_time": "7:30:32"}
|
256 |
+
{"current_steps": 256, "total_steps": 333, "loss": 0.3655, "lr": 3.5050496646118584e-05, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "1 day, 0:38:31", "remaining_time": "7:24:42"}
|
257 |
+
{"current_steps": 257, "total_steps": 333, "loss": 0.364, "lr": 3.4194628694895594e-05, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "1 day, 0:44:21", "remaining_time": "7:18:57"}
|
258 |
+
{"current_steps": 258, "total_steps": 333, "loss": 0.351, "lr": 3.334747566640824e-05, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "1 day, 0:50:14", "remaining_time": "7:13:12"}
|
259 |
+
{"current_steps": 259, "total_steps": 333, "loss": 0.3687, "lr": 3.2509131082969915e-05, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "1 day, 0:56:05", "remaining_time": "7:07:27"}
|
260 |
+
{"current_steps": 260, "total_steps": 333, "loss": 0.3454, "lr": 3.167968749447683e-05, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "1 day, 1:01:38", "remaining_time": "7:01:37"}
|
261 |
+
{"current_steps": 261, "total_steps": 333, "loss": 0.3654, "lr": 3.0859236468190844e-05, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "1 day, 1:07:11", "remaining_time": "6:55:46"}
|
262 |
+
{"current_steps": 262, "total_steps": 333, "loss": 0.3617, "lr": 3.00478685786309e-05, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "1 day, 1:12:49", "remaining_time": "6:49:57"}
|
263 |
+
{"current_steps": 263, "total_steps": 333, "loss": 0.3582, "lr": 2.9245673397573843e-05, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 1:18:42", "remaining_time": "6:44:13"}
|
264 |
+
{"current_steps": 264, "total_steps": 333, "loss": 0.3628, "lr": 2.8452739484166123e-05, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 1:24:23", "remaining_time": "6:38:25"}
|
265 |
+
{"current_steps": 265, "total_steps": 333, "loss": 0.3617, "lr": 2.7669154375147227e-05, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 1:30:15", "remaining_time": "6:32:40"}
|
266 |
+
{"current_steps": 266, "total_steps": 333, "loss": 0.3657, "lr": 2.6895004575185922e-05, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 1:36:03", "remaining_time": "6:26:54"}
|
267 |
+
{"current_steps": 267, "total_steps": 333, "loss": 0.3519, "lr": 2.6130375547330496e-05, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 1:41:53", "remaining_time": "6:21:08"}
|
268 |
+
{"current_steps": 268, "total_steps": 333, "loss": 0.3631, "lr": 2.5375351703574044e-05, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 1:47:52", "remaining_time": "6:15:25"}
|
269 |
+
{"current_steps": 269, "total_steps": 333, "loss": 0.3679, "lr": 2.4630016395535618e-05, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 1:53:35", "remaining_time": "6:09:37"}
|
270 |
+
{"current_steps": 270, "total_steps": 333, "loss": 0.3475, "lr": 2.389445190525866e-05, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 1:59:16", "remaining_time": "6:03:49"}
|
271 |
+
{"current_steps": 271, "total_steps": 333, "loss": 0.3509, "lr": 2.316873943612722e-05, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 2:05:17", "remaining_time": "5:58:06"}
|
272 |
+
{"current_steps": 272, "total_steps": 333, "loss": 0.3597, "lr": 2.2452959103901613e-05, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 2:11:15", "remaining_time": "5:52:22"}
|
273 |
+
{"current_steps": 273, "total_steps": 333, "loss": 0.3515, "lr": 2.1747189927873877e-05, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 2:16:48", "remaining_time": "5:46:33"}
|
274 |
+
{"current_steps": 274, "total_steps": 333, "loss": 0.3695, "lr": 2.1051509822144332e-05, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 2:22:33", "remaining_time": "5:40:46"}
|
275 |
+
{"current_steps": 275, "total_steps": 333, "loss": 0.3592, "lr": 2.0365995587020234e-05, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 2:28:10", "remaining_time": "5:34:57"}
|
276 |
+
{"current_steps": 276, "total_steps": 333, "loss": 0.3634, "lr": 1.969072290053725e-05, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 2:34:10", "remaining_time": "5:29:13"}
|
277 |
+
{"current_steps": 277, "total_steps": 333, "loss": 0.3444, "lr": 1.902576631010499e-05, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 2:39:58", "remaining_time": "5:23:27"}
|
278 |
+
{"current_steps": 278, "total_steps": 333, "loss": 0.3446, "lr": 1.8371199224277213e-05, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 2:45:26", "remaining_time": "5:17:37"}
|
279 |
+
{"current_steps": 279, "total_steps": 333, "loss": 0.3565, "lr": 1.772709390464784e-05, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 2:51:00", "remaining_time": "5:11:48"}
|
280 |
+
{"current_steps": 280, "total_steps": 333, "loss": 0.3667, "lr": 1.7093521457873555e-05, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 2:56:45", "remaining_time": "5:06:01"}
|
281 |
+
{"current_steps": 281, "total_steps": 333, "loss": 0.3486, "lr": 1.647055182782392e-05, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 3:02:28", "remaining_time": "5:00:14"}
|
282 |
+
{"current_steps": 282, "total_steps": 333, "loss": 0.3525, "lr": 1.5858253787859857e-05, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 3:08:16", "remaining_time": "4:54:28"}
|
283 |
+
{"current_steps": 283, "total_steps": 333, "loss": 0.3675, "lr": 1.5256694933241261e-05, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 3:13:58", "remaining_time": "4:48:41"}
|
284 |
+
{"current_steps": 284, "total_steps": 333, "loss": 0.3443, "lr": 1.466594167366493e-05, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 3:19:34", "remaining_time": "4:42:53"}
|
285 |
+
{"current_steps": 285, "total_steps": 333, "loss": 0.3719, "lr": 1.4086059225933016e-05, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 3:25:13", "remaining_time": "4:37:05"}
|
286 |
+
{"current_steps": 286, "total_steps": 333, "loss": 0.3605, "lr": 1.3517111606753471e-05, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 3:30:57", "remaining_time": "4:31:18"}
|
287 |
+
{"current_steps": 287, "total_steps": 333, "loss": 0.3616, "lr": 1.2959161625672802e-05, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 3:36:35", "remaining_time": "4:25:30"}
|
288 |
+
{"current_steps": 288, "total_steps": 333, "loss": 0.3501, "lr": 1.2412270878142156e-05, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 3:42:23", "remaining_time": "4:19:44"}
|
289 |
+
{"current_steps": 289, "total_steps": 333, "loss": 0.3503, "lr": 1.1876499738717436e-05, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 3:48:04", "remaining_time": "4:13:57"}
|
290 |
+
{"current_steps": 290, "total_steps": 333, "loss": 0.3657, "lr": 1.1351907354394194e-05, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 3:54:02", "remaining_time": "4:08:13"}
|
291 |
+
{"current_steps": 291, "total_steps": 333, "loss": 0.3603, "lr": 1.0838551638078013e-05, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 3:59:41", "remaining_time": "4:02:25"}
|
292 |
+
{"current_steps": 292, "total_steps": 333, "loss": 0.3462, "lr": 1.0336489262191212e-05, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 4:05:42", "remaining_time": "3:56:41"}
|
293 |
+
{"current_steps": 293, "total_steps": 333, "loss": 0.3632, "lr": 9.845775652416357e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 4:11:33", "remaining_time": "3:50:55"}
|
294 |
+
{"current_steps": 294, "total_steps": 333, "loss": 0.3594, "lr": 9.366464981577584e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 4:17:14", "remaining_time": "3:45:08"}
|
295 |
+
{"current_steps": 295, "total_steps": 333, "loss": 0.3515, "lr": 8.89861016365997e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 4:23:03", "remaining_time": "3:39:22"}
|
296 |
+
{"current_steps": 296, "total_steps": 333, "loss": 0.3608, "lr": 8.442262847968263e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 4:28:54", "remaining_time": "3:33:36"}
|
297 |
+
{"current_steps": 297, "total_steps": 333, "loss": 0.3592, "lr": 7.997473413424846e-06, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 4:34:43", "remaining_time": "3:27:50"}
|
298 |
+
{"current_steps": 298, "total_steps": 333, "loss": 0.358, "lr": 7.564290963008149e-06, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 4:40:37", "remaining_time": "3:22:05"}
|
299 |
+
{"current_steps": 299, "total_steps": 333, "loss": 0.351, "lr": 7.142763318331872e-06, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 4:46:27", "remaining_time": "3:16:19"}
|
300 |
+
{"current_steps": 300, "total_steps": 333, "loss": 0.3494, "lr": 6.732937014365695e-06, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 4:52:13", "remaining_time": "3:10:32"}
|
301 |
+
{"current_steps": 301, "total_steps": 333, "loss": 0.3587, "lr": 6.3348572942979654e-06, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 4:58:01", "remaining_time": "3:04:46"}
|
302 |
+
{"current_steps": 302, "total_steps": 333, "loss": 0.3651, "lr": 5.948568104541074e-06, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 5:04:00", "remaining_time": "2:59:01"}
|
303 |
+
{"current_steps": 303, "total_steps": 333, "loss": 0.3523, "lr": 5.574112089879872e-06, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 5:09:45", "remaining_time": "2:53:14"}
|
304 |
+
{"current_steps": 304, "total_steps": 333, "loss": 0.3482, "lr": 5.211530588763962e-06, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 5:15:21", "remaining_time": "2:47:27"}
|
305 |
+
{"current_steps": 305, "total_steps": 333, "loss": 0.3564, "lr": 4.860863628744007e-06, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 5:20:43", "remaining_time": "2:41:38"}
|
306 |
+
{"current_steps": 306, "total_steps": 333, "loss": 0.3491, "lr": 4.522149922052897e-06, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 5:26:34", "remaining_time": "2:35:52"}
|
307 |
+
{"current_steps": 307, "total_steps": 333, "loss": 0.3588, "lr": 4.195426861332049e-06, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 5:32:14", "remaining_time": "2:30:05"}
|
308 |
+
{"current_steps": 308, "total_steps": 333, "loss": 0.3427, "lr": 3.880730515503412e-06, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 5:37:51", "remaining_time": "2:24:18"}
|
309 |
+
{"current_steps": 309, "total_steps": 333, "loss": 0.3728, "lr": 3.57809562578763e-06, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 5:43:46", "remaining_time": "2:18:32"}
|
310 |
+
{"current_steps": 310, "total_steps": 333, "loss": 0.3418, "lr": 3.2875556018687533e-06, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 5:49:13", "remaining_time": "2:12:44"}
|
311 |
+
{"current_steps": 311, "total_steps": 333, "loss": 0.3617, "lr": 3.0091425182058514e-06, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 5:54:56", "remaining_time": "2:06:58"}
|
312 |
+
{"current_steps": 312, "total_steps": 333, "loss": 0.3602, "lr": 2.742887110492231e-06, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 6:00:34", "remaining_time": "2:01:11"}
|
313 |
+
{"current_steps": 313, "total_steps": 333, "loss": 0.3532, "lr": 2.4888187722622945e-06, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 6:06:35", "remaining_time": "1:55:26"}
|
314 |
+
{"current_steps": 314, "total_steps": 333, "loss": 0.3579, "lr": 2.2469655516466e-06, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 6:12:34", "remaining_time": "1:49:40"}
|
315 |
+
{"current_steps": 315, "total_steps": 333, "loss": 0.3527, "lr": 2.017354148275491e-06, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 6:18:19", "remaining_time": "1:43:54"}
|
316 |
+
{"current_steps": 316, "total_steps": 333, "loss": 0.357, "lr": 1.8000099103314957e-06, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 6:24:16", "remaining_time": "1:38:08"}
|
317 |
+
{"current_steps": 317, "total_steps": 333, "loss": 0.3633, "lr": 1.5949568317510827e-06, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 6:30:05", "remaining_time": "1:32:22"}
|
318 |
+
{"current_steps": 318, "total_steps": 333, "loss": 0.357, "lr": 1.402217549575769e-06, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 6:35:59", "remaining_time": "1:26:36"}
|
319 |
+
{"current_steps": 319, "total_steps": 333, "loss": 0.3528, "lr": 1.2218133414530984e-06, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 6:41:41", "remaining_time": "1:20:49"}
|
320 |
+
{"current_steps": 320, "total_steps": 333, "loss": 0.3614, "lr": 1.0537641232876473e-06, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 6:47:41", "remaining_time": "1:15:03"}
|
321 |
+
{"current_steps": 321, "total_steps": 333, "loss": 0.3551, "lr": 8.980884470424321e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 6:53:44", "remaining_time": "1:09:17"}
|
322 |
+
{"current_steps": 322, "total_steps": 333, "loss": 0.3545, "lr": 7.548034986908066e-07, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 6:59:21", "remaining_time": "1:03:31"}
|
323 |
+
{"current_steps": 323, "total_steps": 333, "loss": 0.3583, "lr": 6.239250963192269e-07, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 7:05:04", "remaining_time": "0:57:44"}
|
324 |
+
{"current_steps": 324, "total_steps": 333, "loss": 0.3533, "lr": 5.054676883809827e-07, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 7:10:50", "remaining_time": "0:51:58"}
|
325 |
+
{"current_steps": 325, "total_steps": 333, "loss": 0.3627, "lr": 3.994443521011485e-07, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 7:16:30", "remaining_time": "0:46:11"}
|
326 |
+
{"current_steps": 326, "total_steps": 333, "loss": 0.348, "lr": 3.058667920329281e-07, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 7:22:22", "remaining_time": "0:40:25"}
|
327 |
+
{"current_steps": 327, "total_steps": 333, "loss": 0.3455, "lr": 2.2474533876546995e-07, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 7:28:16", "remaining_time": "0:34:38"}
|
328 |
+
{"current_steps": 328, "total_steps": 333, "loss": 0.3579, "lr": 1.560889477834654e-07, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 7:34:04", "remaining_time": "0:28:52"}
|
329 |
+
{"current_steps": 329, "total_steps": 333, "loss": 0.3528, "lr": 9.99051984784689e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 7:39:54", "remaining_time": "0:23:05"}
|
330 |
+
{"current_steps": 330, "total_steps": 333, "loss": 0.3564, "lr": 5.620029331218986e-08, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 7:45:29", "remaining_time": "0:17:19"}
|
331 |
+
{"current_steps": 331, "total_steps": 333, "loss": 0.3594, "lr": 2.4979057131732006e-08, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 7:51:38", "remaining_time": "0:11:33"}
|
332 |
+
{"current_steps": 332, "total_steps": 333, "loss": 0.3521, "lr": 6.2449366369555176e-09, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 7:57:26", "remaining_time": "0:05:46"}
|
333 |
+
{"current_steps": 333, "total_steps": 333, "loss": 0.3558, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:03:19", "remaining_time": "0:00:00"}
|
334 |
+
{"current_steps": 333, "total_steps": 333, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:04:52", "remaining_time": "0:00:00"}
|