Training in progress, step 639
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe6b7e9be412c0d1942d6b536fb3f1a839317705a8a032e77981103610aab249
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60f4821bb487cee638093f55f4ec7313392620383e6667433fdb19a1523d9916
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d801f1757f457de1bf8d595d699e0d767aec645e29a4f6ef310cd43cb14664ba
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfdb9f5877f652eda826277a2176d6e13834a4d027e648fa8bed3f1b60a71982
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -407,3 +407,234 @@
|
|
407 |
{"current_steps": 407, "total_steps": 639, "loss": 0.4813, "lr": 3.5069685373955442e-06, "epoch": 1.9107981220657277, "percentage": 63.69, "elapsed_time": "1:26:28", "remaining_time": "0:49:17"}
|
408 |
{"current_steps": 408, "total_steps": 639, "loss": 0.5376, "lr": 3.480919109504984e-06, "epoch": 1.915492957746479, "percentage": 63.85, "elapsed_time": "1:26:41", "remaining_time": "0:49:04"}
|
409 |
{"current_steps": 409, "total_steps": 639, "loss": 0.5424, "lr": 3.4549150281252635e-06, "epoch": 1.92018779342723, "percentage": 64.01, "elapsed_time": "1:26:53", "remaining_time": "0:48:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
407 |
{"current_steps": 407, "total_steps": 639, "loss": 0.4813, "lr": 3.5069685373955442e-06, "epoch": 1.9107981220657277, "percentage": 63.69, "elapsed_time": "1:26:28", "remaining_time": "0:49:17"}
|
408 |
{"current_steps": 408, "total_steps": 639, "loss": 0.5376, "lr": 3.480919109504984e-06, "epoch": 1.915492957746479, "percentage": 63.85, "elapsed_time": "1:26:41", "remaining_time": "0:49:04"}
|
409 |
{"current_steps": 409, "total_steps": 639, "loss": 0.5424, "lr": 3.4549150281252635e-06, "epoch": 1.92018779342723, "percentage": 64.01, "elapsed_time": "1:26:53", "remaining_time": "0:48:51"}
|
410 |
+
{"current_steps": 410, "total_steps": 639, "loss": 0.5585, "lr": 3.428957069511529e-06, "epoch": 1.9248826291079812, "percentage": 64.16, "elapsed_time": "1:27:05", "remaining_time": "0:48:38"}
|
411 |
+
{"current_steps": 411, "total_steps": 639, "loss": 0.5654, "lr": 3.4030460085421e-06, "epoch": 1.9295774647887325, "percentage": 64.32, "elapsed_time": "1:27:23", "remaining_time": "0:48:28"}
|
412 |
+
{"current_steps": 412, "total_steps": 639, "loss": 0.575, "lr": 3.3771826186953483e-06, "epoch": 1.9342723004694835, "percentage": 64.48, "elapsed_time": "1:27:33", "remaining_time": "0:48:14"}
|
413 |
+
{"current_steps": 413, "total_steps": 639, "loss": 0.5427, "lr": 3.3513676720265937e-06, "epoch": 1.9389671361502347, "percentage": 64.63, "elapsed_time": "1:27:46", "remaining_time": "0:48:01"}
|
414 |
+
{"current_steps": 414, "total_steps": 639, "loss": 0.5636, "lr": 3.3256019391450696e-06, "epoch": 1.943661971830986, "percentage": 64.79, "elapsed_time": "1:28:02", "remaining_time": "0:47:50"}
|
415 |
+
{"current_steps": 415, "total_steps": 639, "loss": 0.5498, "lr": 3.299886189190915e-06, "epoch": 1.948356807511737, "percentage": 64.95, "elapsed_time": "1:28:15", "remaining_time": "0:47:38"}
|
416 |
+
{"current_steps": 416, "total_steps": 639, "loss": 0.5556, "lr": 3.2742211898122123e-06, "epoch": 1.9530516431924883, "percentage": 65.1, "elapsed_time": "1:28:27", "remaining_time": "0:47:25"}
|
417 |
+
{"current_steps": 417, "total_steps": 639, "loss": 0.5339, "lr": 3.248607707142073e-06, "epoch": 1.9577464788732395, "percentage": 65.26, "elapsed_time": "1:28:38", "remaining_time": "0:47:11"}
|
418 |
+
{"current_steps": 418, "total_steps": 639, "loss": 0.5348, "lr": 3.2230465057757754e-06, "epoch": 1.9624413145539905, "percentage": 65.41, "elapsed_time": "1:28:48", "remaining_time": "0:46:57"}
|
419 |
+
{"current_steps": 419, "total_steps": 639, "loss": 0.579, "lr": 3.197538348747927e-06, "epoch": 1.9671361502347418, "percentage": 65.57, "elapsed_time": "1:29:02", "remaining_time": "0:46:45"}
|
420 |
+
{"current_steps": 420, "total_steps": 639, "loss": 0.5212, "lr": 3.1720839975096974e-06, "epoch": 1.971830985915493, "percentage": 65.73, "elapsed_time": "1:29:19", "remaining_time": "0:46:34"}
|
421 |
+
{"current_steps": 421, "total_steps": 639, "loss": 0.5536, "lr": 3.14668421190608e-06, "epoch": 1.976525821596244, "percentage": 65.88, "elapsed_time": "1:29:29", "remaining_time": "0:46:20"}
|
422 |
+
{"current_steps": 422, "total_steps": 639, "loss": 0.5324, "lr": 3.1213397501532216e-06, "epoch": 1.9812206572769953, "percentage": 66.04, "elapsed_time": "1:29:40", "remaining_time": "0:46:06"}
|
423 |
+
{"current_steps": 423, "total_steps": 639, "loss": 0.5047, "lr": 3.096051368815776e-06, "epoch": 1.9859154929577465, "percentage": 66.2, "elapsed_time": "1:29:49", "remaining_time": "0:45:52"}
|
424 |
+
{"current_steps": 424, "total_steps": 639, "loss": 0.534, "lr": 3.070819822784323e-06, "epoch": 1.9906103286384975, "percentage": 66.35, "elapsed_time": "1:30:02", "remaining_time": "0:45:39"}
|
425 |
+
{"current_steps": 425, "total_steps": 639, "loss": 0.5172, "lr": 3.045645865252842e-06, "epoch": 1.995305164319249, "percentage": 66.51, "elapsed_time": "1:30:16", "remaining_time": "0:45:27"}
|
426 |
+
{"current_steps": 426, "total_steps": 639, "loss": 0.5061, "lr": 3.0205302476962186e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:30:27", "remaining_time": "0:45:13"}
|
427 |
+
{"current_steps": 427, "total_steps": 639, "loss": 0.4319, "lr": 2.9954737198478122e-06, "epoch": 2.004694835680751, "percentage": 66.82, "elapsed_time": "1:30:37", "remaining_time": "0:44:59"}
|
428 |
+
{"current_steps": 428, "total_steps": 639, "loss": 0.4459, "lr": 2.9704770296770823e-06, "epoch": 2.0093896713615025, "percentage": 66.98, "elapsed_time": "1:30:47", "remaining_time": "0:44:45"}
|
429 |
+
{"current_steps": 429, "total_steps": 639, "loss": 0.4305, "lr": 2.9455409233672594e-06, "epoch": 2.0140845070422535, "percentage": 67.14, "elapsed_time": "1:30:59", "remaining_time": "0:44:32"}
|
430 |
+
{"current_steps": 430, "total_steps": 639, "loss": 0.4345, "lr": 2.920666145293063e-06, "epoch": 2.0187793427230045, "percentage": 67.29, "elapsed_time": "1:31:13", "remaining_time": "0:44:20"}
|
431 |
+
{"current_steps": 431, "total_steps": 639, "loss": 0.4315, "lr": 2.895853437998487e-06, "epoch": 2.023474178403756, "percentage": 67.45, "elapsed_time": "1:31:27", "remaining_time": "0:44:08"}
|
432 |
+
{"current_steps": 432, "total_steps": 639, "loss": 0.4592, "lr": 2.871103542174637e-06, "epoch": 2.028169014084507, "percentage": 67.61, "elapsed_time": "1:31:38", "remaining_time": "0:43:54"}
|
433 |
+
{"current_steps": 433, "total_steps": 639, "loss": 0.445, "lr": 2.846417196637613e-06, "epoch": 2.032863849765258, "percentage": 67.76, "elapsed_time": "1:31:49", "remaining_time": "0:43:41"}
|
434 |
+
{"current_steps": 434, "total_steps": 639, "loss": 0.4513, "lr": 2.8217951383064546e-06, "epoch": 2.0375586854460095, "percentage": 67.92, "elapsed_time": "1:32:04", "remaining_time": "0:43:29"}
|
435 |
+
{"current_steps": 435, "total_steps": 639, "loss": 0.4413, "lr": 2.7972381021811516e-06, "epoch": 2.0422535211267605, "percentage": 68.08, "elapsed_time": "1:32:18", "remaining_time": "0:43:17"}
|
436 |
+
{"current_steps": 436, "total_steps": 639, "loss": 0.4389, "lr": 2.7727468213206944e-06, "epoch": 2.0469483568075115, "percentage": 68.23, "elapsed_time": "1:32:29", "remaining_time": "0:43:03"}
|
437 |
+
{"current_steps": 437, "total_steps": 639, "loss": 0.4276, "lr": 2.748322026821197e-06, "epoch": 2.051643192488263, "percentage": 68.39, "elapsed_time": "1:32:39", "remaining_time": "0:42:49"}
|
438 |
+
{"current_steps": 438, "total_steps": 639, "loss": 0.4169, "lr": 2.723964447794064e-06, "epoch": 2.056338028169014, "percentage": 68.54, "elapsed_time": "1:32:51", "remaining_time": "0:42:36"}
|
439 |
+
{"current_steps": 439, "total_steps": 639, "loss": 0.4369, "lr": 2.6996748113442397e-06, "epoch": 2.0610328638497655, "percentage": 68.7, "elapsed_time": "1:33:04", "remaining_time": "0:42:24"}
|
440 |
+
{"current_steps": 440, "total_steps": 639, "loss": 0.4546, "lr": 2.6754538425484916e-06, "epoch": 2.0657276995305165, "percentage": 68.86, "elapsed_time": "1:33:16", "remaining_time": "0:42:11"}
|
441 |
+
{"current_steps": 441, "total_steps": 639, "loss": 0.4352, "lr": 2.651302264433772e-06, "epoch": 2.0704225352112675, "percentage": 69.01, "elapsed_time": "1:33:28", "remaining_time": "0:41:58"}
|
442 |
+
{"current_steps": 442, "total_steps": 639, "loss": 0.399, "lr": 2.6272207979556276e-06, "epoch": 2.075117370892019, "percentage": 69.17, "elapsed_time": "1:33:38", "remaining_time": "0:41:44"}
|
443 |
+
{"current_steps": 443, "total_steps": 639, "loss": 0.4397, "lr": 2.603210161976687e-06, "epoch": 2.07981220657277, "percentage": 69.33, "elapsed_time": "1:33:47", "remaining_time": "0:41:29"}
|
444 |
+
{"current_steps": 444, "total_steps": 639, "loss": 0.4241, "lr": 2.5792710732452e-06, "epoch": 2.084507042253521, "percentage": 69.48, "elapsed_time": "1:34:00", "remaining_time": "0:41:17"}
|
445 |
+
{"current_steps": 445, "total_steps": 639, "loss": 0.4446, "lr": 2.555404246373629e-06, "epoch": 2.0892018779342725, "percentage": 69.64, "elapsed_time": "1:34:16", "remaining_time": "0:41:05"}
|
446 |
+
{"current_steps": 446, "total_steps": 639, "loss": 0.4075, "lr": 2.531610393817343e-06, "epoch": 2.0938967136150235, "percentage": 69.8, "elapsed_time": "1:34:28", "remaining_time": "0:40:52"}
|
447 |
+
{"current_steps": 447, "total_steps": 639, "loss": 0.4292, "lr": 2.5078902258533206e-06, "epoch": 2.0985915492957745, "percentage": 69.95, "elapsed_time": "1:34:39", "remaining_time": "0:40:39"}
|
448 |
+
{"current_steps": 448, "total_steps": 639, "loss": 0.4446, "lr": 2.4842444505589667e-06, "epoch": 2.103286384976526, "percentage": 70.11, "elapsed_time": "1:34:50", "remaining_time": "0:40:26"}
|
449 |
+
{"current_steps": 449, "total_steps": 639, "loss": 0.4168, "lr": 2.4606737737909696e-06, "epoch": 2.107981220657277, "percentage": 70.27, "elapsed_time": "1:35:00", "remaining_time": "0:40:12"}
|
450 |
+
{"current_steps": 450, "total_steps": 639, "loss": 0.479, "lr": 2.437178899164232e-06, "epoch": 2.112676056338028, "percentage": 70.42, "elapsed_time": "1:35:13", "remaining_time": "0:39:59"}
|
451 |
+
{"current_steps": 451, "total_steps": 639, "loss": 0.433, "lr": 2.4137605280308583e-06, "epoch": 2.1173708920187795, "percentage": 70.58, "elapsed_time": "1:35:27", "remaining_time": "0:39:47"}
|
452 |
+
{"current_steps": 452, "total_steps": 639, "loss": 0.4366, "lr": 2.3904193594592334e-06, "epoch": 2.1220657276995305, "percentage": 70.74, "elapsed_time": "1:35:42", "remaining_time": "0:39:35"}
|
453 |
+
{"current_steps": 453, "total_steps": 639, "loss": 0.4598, "lr": 2.3671560902131445e-06, "epoch": 2.1267605633802815, "percentage": 70.89, "elapsed_time": "1:35:53", "remaining_time": "0:39:22"}
|
454 |
+
{"current_steps": 454, "total_steps": 639, "loss": 0.4234, "lr": 2.3439714147309845e-06, "epoch": 2.131455399061033, "percentage": 71.05, "elapsed_time": "1:36:04", "remaining_time": "0:39:09"}
|
455 |
+
{"current_steps": 455, "total_steps": 639, "loss": 0.4511, "lr": 2.320866025105016e-06, "epoch": 2.136150234741784, "percentage": 71.21, "elapsed_time": "1:36:19", "remaining_time": "0:38:57"}
|
456 |
+
{"current_steps": 456, "total_steps": 639, "loss": 0.456, "lr": 2.297840611060729e-06, "epoch": 2.140845070422535, "percentage": 71.36, "elapsed_time": "1:36:30", "remaining_time": "0:38:43"}
|
457 |
+
{"current_steps": 457, "total_steps": 639, "loss": 0.4226, "lr": 2.274895859936229e-06, "epoch": 2.1455399061032865, "percentage": 71.52, "elapsed_time": "1:36:42", "remaining_time": "0:38:30"}
|
458 |
+
{"current_steps": 458, "total_steps": 639, "loss": 0.4369, "lr": 2.252032456661736e-06, "epoch": 2.1502347417840375, "percentage": 71.67, "elapsed_time": "1:36:54", "remaining_time": "0:38:17"}
|
459 |
+
{"current_steps": 459, "total_steps": 639, "loss": 0.4357, "lr": 2.229251083739127e-06, "epoch": 2.1549295774647885, "percentage": 71.83, "elapsed_time": "1:37:03", "remaining_time": "0:38:03"}
|
460 |
+
{"current_steps": 460, "total_steps": 639, "loss": 0.4273, "lr": 2.2065524212215744e-06, "epoch": 2.15962441314554, "percentage": 71.99, "elapsed_time": "1:37:16", "remaining_time": "0:37:51"}
|
461 |
+
{"current_steps": 461, "total_steps": 639, "loss": 0.4608, "lr": 2.1839371466932353e-06, "epoch": 2.164319248826291, "percentage": 72.14, "elapsed_time": "1:37:30", "remaining_time": "0:37:38"}
|
462 |
+
{"current_steps": 462, "total_steps": 639, "loss": 0.4546, "lr": 2.161405935249029e-06, "epoch": 2.169014084507042, "percentage": 72.3, "elapsed_time": "1:37:40", "remaining_time": "0:37:25"}
|
463 |
+
{"current_steps": 463, "total_steps": 639, "loss": 0.4517, "lr": 2.138959459474487e-06, "epoch": 2.1737089201877935, "percentage": 72.46, "elapsed_time": "1:37:56", "remaining_time": "0:37:13"}
|
464 |
+
{"current_steps": 464, "total_steps": 639, "loss": 0.4452, "lr": 2.1165983894256647e-06, "epoch": 2.1784037558685445, "percentage": 72.61, "elapsed_time": "1:38:09", "remaining_time": "0:37:01"}
|
465 |
+
{"current_steps": 465, "total_steps": 639, "loss": 0.4554, "lr": 2.094323392609158e-06, "epoch": 2.183098591549296, "percentage": 72.77, "elapsed_time": "1:38:23", "remaining_time": "0:36:49"}
|
466 |
+
{"current_steps": 466, "total_steps": 639, "loss": 0.449, "lr": 2.072135133962153e-06, "epoch": 2.187793427230047, "percentage": 72.93, "elapsed_time": "1:38:36", "remaining_time": "0:36:36"}
|
467 |
+
{"current_steps": 467, "total_steps": 639, "loss": 0.428, "lr": 2.050034275832607e-06, "epoch": 2.192488262910798, "percentage": 73.08, "elapsed_time": "1:38:46", "remaining_time": "0:36:22"}
|
468 |
+
{"current_steps": 468, "total_steps": 639, "loss": 0.4421, "lr": 2.028021477959445e-06, "epoch": 2.1971830985915495, "percentage": 73.24, "elapsed_time": "1:38:59", "remaining_time": "0:36:10"}
|
469 |
+
{"current_steps": 469, "total_steps": 639, "loss": 0.4318, "lr": 2.0060973974528873e-06, "epoch": 2.2018779342723005, "percentage": 73.4, "elapsed_time": "1:39:11", "remaining_time": "0:35:57"}
|
470 |
+
{"current_steps": 470, "total_steps": 639, "loss": 0.4329, "lr": 1.9842626887748284e-06, "epoch": 2.2065727699530515, "percentage": 73.55, "elapsed_time": "1:39:24", "remaining_time": "0:35:44"}
|
471 |
+
{"current_steps": 471, "total_steps": 639, "loss": 0.4237, "lr": 1.962518003719297e-06, "epoch": 2.211267605633803, "percentage": 73.71, "elapsed_time": "1:39:39", "remaining_time": "0:35:32"}
|
472 |
+
{"current_steps": 472, "total_steps": 639, "loss": 0.4468, "lr": 1.9408639913929994e-06, "epoch": 2.215962441314554, "percentage": 73.87, "elapsed_time": "1:39:49", "remaining_time": "0:35:19"}
|
473 |
+
{"current_steps": 473, "total_steps": 639, "loss": 0.4446, "lr": 1.9193012981959473e-06, "epoch": 2.220657276995305, "percentage": 74.02, "elapsed_time": "1:40:00", "remaining_time": "0:35:05"}
|
474 |
+
{"current_steps": 474, "total_steps": 639, "loss": 0.4454, "lr": 1.8978305678021598e-06, "epoch": 2.2253521126760565, "percentage": 74.18, "elapsed_time": "1:40:11", "remaining_time": "0:34:52"}
|
475 |
+
{"current_steps": 475, "total_steps": 639, "loss": 0.4305, "lr": 1.8764524411404494e-06, "epoch": 2.2300469483568075, "percentage": 74.33, "elapsed_time": "1:40:24", "remaining_time": "0:34:40"}
|
476 |
+
{"current_steps": 476, "total_steps": 639, "loss": 0.4342, "lr": 1.8551675563752808e-06, "epoch": 2.2347417840375585, "percentage": 74.49, "elapsed_time": "1:40:37", "remaining_time": "0:34:27"}
|
477 |
+
{"current_steps": 477, "total_steps": 639, "loss": 0.4324, "lr": 1.833976548887742e-06, "epoch": 2.23943661971831, "percentage": 74.65, "elapsed_time": "1:40:47", "remaining_time": "0:34:13"}
|
478 |
+
{"current_steps": 478, "total_steps": 639, "loss": 0.4432, "lr": 1.8128800512565514e-06, "epoch": 2.244131455399061, "percentage": 74.8, "elapsed_time": "1:40:56", "remaining_time": "0:34:00"}
|
479 |
+
{"current_steps": 479, "total_steps": 639, "loss": 0.4199, "lr": 1.7918786932391945e-06, "epoch": 2.248826291079812, "percentage": 74.96, "elapsed_time": "1:41:07", "remaining_time": "0:33:46"}
|
480 |
+
{"current_steps": 480, "total_steps": 639, "loss": 0.4295, "lr": 1.7709731017531156e-06, "epoch": 2.2535211267605635, "percentage": 75.12, "elapsed_time": "1:41:20", "remaining_time": "0:33:34"}
|
481 |
+
{"current_steps": 481, "total_steps": 639, "loss": 0.4337, "lr": 1.750163900857003e-06, "epoch": 2.2582159624413145, "percentage": 75.27, "elapsed_time": "1:41:33", "remaining_time": "0:33:21"}
|
482 |
+
{"current_steps": 482, "total_steps": 639, "loss": 0.4287, "lr": 1.7294517117321657e-06, "epoch": 2.262910798122066, "percentage": 75.43, "elapsed_time": "1:41:43", "remaining_time": "0:33:08"}
|
483 |
+
{"current_steps": 483, "total_steps": 639, "loss": 0.4477, "lr": 1.7088371526639852e-06, "epoch": 2.267605633802817, "percentage": 75.59, "elapsed_time": "1:41:56", "remaining_time": "0:32:55"}
|
484 |
+
{"current_steps": 484, "total_steps": 639, "loss": 0.4242, "lr": 1.688320839023463e-06, "epoch": 2.272300469483568, "percentage": 75.74, "elapsed_time": "1:42:06", "remaining_time": "0:32:42"}
|
485 |
+
{"current_steps": 485, "total_steps": 639, "loss": 0.4346, "lr": 1.6679033832488433e-06, "epoch": 2.276995305164319, "percentage": 75.9, "elapsed_time": "1:42:19", "remaining_time": "0:32:29"}
|
486 |
+
{"current_steps": 486, "total_steps": 639, "loss": 0.4444, "lr": 1.6475853948273429e-06, "epoch": 2.2816901408450705, "percentage": 76.06, "elapsed_time": "1:42:31", "remaining_time": "0:32:16"}
|
487 |
+
{"current_steps": 487, "total_steps": 639, "loss": 0.4273, "lr": 1.6273674802769468e-06, "epoch": 2.2863849765258215, "percentage": 76.21, "elapsed_time": "1:42:42", "remaining_time": "0:32:03"}
|
488 |
+
{"current_steps": 488, "total_steps": 639, "loss": 0.399, "lr": 1.6072502431283093e-06, "epoch": 2.291079812206573, "percentage": 76.37, "elapsed_time": "1:42:53", "remaining_time": "0:31:50"}
|
489 |
+
{"current_steps": 489, "total_steps": 639, "loss": 0.4243, "lr": 1.5872342839067305e-06, "epoch": 2.295774647887324, "percentage": 76.53, "elapsed_time": "1:43:05", "remaining_time": "0:31:37"}
|
490 |
+
{"current_steps": 490, "total_steps": 639, "loss": 0.4583, "lr": 1.5673202001142396e-06, "epoch": 2.300469483568075, "percentage": 76.68, "elapsed_time": "1:43:17", "remaining_time": "0:31:24"}
|
491 |
+
{"current_steps": 491, "total_steps": 639, "loss": 0.431, "lr": 1.547508586211751e-06, "epoch": 2.3051643192488265, "percentage": 76.84, "elapsed_time": "1:43:31", "remaining_time": "0:31:12"}
|
492 |
+
{"current_steps": 492, "total_steps": 639, "loss": 0.4198, "lr": 1.527800033601326e-06, "epoch": 2.3098591549295775, "percentage": 77.0, "elapsed_time": "1:43:45", "remaining_time": "0:31:00"}
|
493 |
+
{"current_steps": 493, "total_steps": 639, "loss": 0.4341, "lr": 1.5081951306085042e-06, "epoch": 2.3145539906103285, "percentage": 77.15, "elapsed_time": "1:43:53", "remaining_time": "0:30:46"}
|
494 |
+
{"current_steps": 494, "total_steps": 639, "loss": 0.4465, "lr": 1.4886944624647647e-06, "epoch": 2.31924882629108, "percentage": 77.31, "elapsed_time": "1:44:02", "remaining_time": "0:30:32"}
|
495 |
+
{"current_steps": 495, "total_steps": 639, "loss": 0.4188, "lr": 1.4692986112900315e-06, "epoch": 2.323943661971831, "percentage": 77.46, "elapsed_time": "1:44:12", "remaining_time": "0:30:19"}
|
496 |
+
{"current_steps": 496, "total_steps": 639, "loss": 0.4557, "lr": 1.4500081560753154e-06, "epoch": 2.328638497652582, "percentage": 77.62, "elapsed_time": "1:44:25", "remaining_time": "0:30:06"}
|
497 |
+
{"current_steps": 497, "total_steps": 639, "loss": 0.4304, "lr": 1.4308236726654151e-06, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "1:44:42", "remaining_time": "0:29:55"}
|
498 |
+
{"current_steps": 498, "total_steps": 639, "loss": 0.4382, "lr": 1.4117457337417456e-06, "epoch": 2.3380281690140845, "percentage": 77.93, "elapsed_time": "1:44:51", "remaining_time": "0:29:41"}
|
499 |
+
{"current_steps": 499, "total_steps": 639, "loss": 0.4428, "lr": 1.3927749088052218e-06, "epoch": 2.3427230046948355, "percentage": 78.09, "elapsed_time": "1:45:02", "remaining_time": "0:29:28"}
|
500 |
+
{"current_steps": 500, "total_steps": 639, "loss": 0.4599, "lr": 1.3739117641592752e-06, "epoch": 2.347417840375587, "percentage": 78.25, "elapsed_time": "1:45:15", "remaining_time": "0:29:15"}
|
501 |
+
{"current_steps": 501, "total_steps": 639, "loss": 0.4293, "lr": 1.3551568628929434e-06, "epoch": 2.352112676056338, "percentage": 78.4, "elapsed_time": "1:45:30", "remaining_time": "0:29:03"}
|
502 |
+
{"current_steps": 502, "total_steps": 639, "loss": 0.4311, "lr": 1.336510764864054e-06, "epoch": 2.356807511737089, "percentage": 78.56, "elapsed_time": "1:45:45", "remaining_time": "0:28:51"}
|
503 |
+
{"current_steps": 503, "total_steps": 639, "loss": 0.4217, "lr": 1.3179740266825253e-06, "epoch": 2.3615023474178405, "percentage": 78.72, "elapsed_time": "1:45:56", "remaining_time": "0:28:38"}
|
504 |
+
{"current_steps": 504, "total_steps": 639, "loss": 0.4272, "lr": 1.2995472016937405e-06, "epoch": 2.3661971830985915, "percentage": 78.87, "elapsed_time": "1:46:06", "remaining_time": "0:28:25"}
|
505 |
+
{"current_steps": 505, "total_steps": 639, "loss": 0.4732, "lr": 1.281230839962036e-06, "epoch": 2.370892018779343, "percentage": 79.03, "elapsed_time": "1:46:20", "remaining_time": "0:28:12"}
|
506 |
+
{"current_steps": 506, "total_steps": 639, "loss": 0.4294, "lr": 1.2630254882542737e-06, "epoch": 2.375586854460094, "percentage": 79.19, "elapsed_time": "1:46:33", "remaining_time": "0:28:00"}
|
507 |
+
{"current_steps": 507, "total_steps": 639, "loss": 0.416, "lr": 1.2449316900235275e-06, "epoch": 2.380281690140845, "percentage": 79.34, "elapsed_time": "1:46:47", "remaining_time": "0:27:48"}
|
508 |
+
{"current_steps": 508, "total_steps": 639, "loss": 0.4169, "lr": 1.226949985392858e-06, "epoch": 2.384976525821596, "percentage": 79.5, "elapsed_time": "1:47:03", "remaining_time": "0:27:36"}
|
509 |
+
{"current_steps": 509, "total_steps": 639, "loss": 0.4556, "lr": 1.209080911139187e-06, "epoch": 2.3896713615023475, "percentage": 79.66, "elapsed_time": "1:47:14", "remaining_time": "0:27:23"}
|
510 |
+
{"current_steps": 510, "total_steps": 639, "loss": 0.4297, "lr": 1.1913250006772714e-06, "epoch": 2.3943661971830985, "percentage": 79.81, "elapsed_time": "1:47:27", "remaining_time": "0:27:10"}
|
511 |
+
{"current_steps": 511, "total_steps": 639, "loss": 0.4398, "lr": 1.1736827840437932e-06, "epoch": 2.39906103286385, "percentage": 79.97, "elapsed_time": "1:47:39", "remaining_time": "0:26:58"}
|
512 |
+
{"current_steps": 512, "total_steps": 639, "loss": 0.4494, "lr": 1.1561547878815172e-06, "epoch": 2.403755868544601, "percentage": 80.13, "elapsed_time": "1:47:51", "remaining_time": "0:26:45"}
|
513 |
+
{"current_steps": 513, "total_steps": 639, "loss": 0.4445, "lr": 1.1387415354235887e-06, "epoch": 2.408450704225352, "percentage": 80.28, "elapsed_time": "1:48:01", "remaining_time": "0:26:32"}
|
514 |
+
{"current_steps": 514, "total_steps": 639, "loss": 0.4449, "lr": 1.1214435464779006e-06, "epoch": 2.4131455399061035, "percentage": 80.44, "elapsed_time": "1:48:13", "remaining_time": "0:26:19"}
|
515 |
+
{"current_steps": 515, "total_steps": 639, "loss": 0.4597, "lr": 1.1042613374115896e-06, "epoch": 2.4178403755868545, "percentage": 80.59, "elapsed_time": "1:48:26", "remaining_time": "0:26:06"}
|
516 |
+
{"current_steps": 516, "total_steps": 639, "loss": 0.4549, "lr": 1.0871954211356068e-06, "epoch": 2.4225352112676055, "percentage": 80.75, "elapsed_time": "1:48:39", "remaining_time": "0:25:54"}
|
517 |
+
{"current_steps": 517, "total_steps": 639, "loss": 0.4342, "lr": 1.0702463070894192e-06, "epoch": 2.427230046948357, "percentage": 80.91, "elapsed_time": "1:48:53", "remaining_time": "0:25:41"}
|
518 |
+
{"current_steps": 518, "total_steps": 639, "loss": 0.4478, "lr": 1.0534145012257962e-06, "epoch": 2.431924882629108, "percentage": 81.06, "elapsed_time": "1:49:07", "remaining_time": "0:25:29"}
|
519 |
+
{"current_steps": 519, "total_steps": 639, "loss": 0.4344, "lr": 1.0367005059957097e-06, "epoch": 2.436619718309859, "percentage": 81.22, "elapsed_time": "1:49:22", "remaining_time": "0:25:17"}
|
520 |
+
{"current_steps": 520, "total_steps": 639, "loss": 0.4316, "lr": 1.0201048203333281e-06, "epoch": 2.4413145539906105, "percentage": 81.38, "elapsed_time": "1:49:35", "remaining_time": "0:25:04"}
|
521 |
+
{"current_steps": 521, "total_steps": 639, "loss": 0.4593, "lr": 1.003627939641133e-06, "epoch": 2.4460093896713615, "percentage": 81.53, "elapsed_time": "1:49:48", "remaining_time": "0:24:52"}
|
522 |
+
{"current_steps": 522, "total_steps": 639, "loss": 0.4367, "lr": 9.87270355775124e-07, "epoch": 2.4507042253521125, "percentage": 81.69, "elapsed_time": "1:50:00", "remaining_time": "0:24:39"}
|
523 |
+
{"current_steps": 523, "total_steps": 639, "loss": 0.4335, "lr": 9.710325570301348e-07, "epoch": 2.455399061032864, "percentage": 81.85, "elapsed_time": "1:50:12", "remaining_time": "0:24:26"}
|
524 |
+
{"current_steps": 524, "total_steps": 639, "loss": 0.4536, "lr": 9.549150281252633e-07, "epoch": 2.460093896713615, "percentage": 82.0, "elapsed_time": "1:50:21", "remaining_time": "0:24:13"}
|
525 |
+
{"current_steps": 525, "total_steps": 639, "loss": 0.4571, "lr": 9.389182501893967e-07, "epoch": 2.464788732394366, "percentage": 82.16, "elapsed_time": "1:50:38", "remaining_time": "0:24:01"}
|
526 |
+
{"current_steps": 526, "total_steps": 639, "loss": 0.4395, "lr": 9.230427007468534e-07, "epoch": 2.4694835680751175, "percentage": 82.32, "elapsed_time": "1:50:52", "remaining_time": "0:23:49"}
|
527 |
+
{"current_steps": 527, "total_steps": 639, "loss": 0.4159, "lr": 9.072888537031216e-07, "epoch": 2.4741784037558685, "percentage": 82.47, "elapsed_time": "1:51:04", "remaining_time": "0:23:36"}
|
528 |
+
{"current_steps": 528, "total_steps": 639, "loss": 0.4016, "lr": 8.916571793307205e-07, "epoch": 2.4788732394366195, "percentage": 82.63, "elapsed_time": "1:51:13", "remaining_time": "0:23:22"}
|
529 |
+
{"current_steps": 529, "total_steps": 639, "loss": 0.4293, "lr": 8.761481442551573e-07, "epoch": 2.483568075117371, "percentage": 82.79, "elapsed_time": "1:51:26", "remaining_time": "0:23:10"}
|
530 |
+
{"current_steps": 530, "total_steps": 639, "loss": 0.4228, "lr": 8.607622114410014e-07, "epoch": 2.488262910798122, "percentage": 82.94, "elapsed_time": "1:51:39", "remaining_time": "0:22:57"}
|
531 |
+
{"current_steps": 531, "total_steps": 639, "loss": 0.4045, "lr": 8.454998401780551e-07, "epoch": 2.492957746478873, "percentage": 83.1, "elapsed_time": "1:51:51", "remaining_time": "0:22:45"}
|
532 |
+
{"current_steps": 532, "total_steps": 639, "loss": 0.4193, "lr": 8.303614860676601e-07, "epoch": 2.4976525821596245, "percentage": 83.26, "elapsed_time": "1:52:01", "remaining_time": "0:22:31"}
|
533 |
+
{"current_steps": 533, "total_steps": 639, "loss": 0.4271, "lr": 8.153476010090789e-07, "epoch": 2.5023474178403755, "percentage": 83.41, "elapsed_time": "1:52:13", "remaining_time": "0:22:19"}
|
534 |
+
{"current_steps": 534, "total_steps": 639, "loss": 0.4432, "lr": 8.004586331860176e-07, "epoch": 2.507042253521127, "percentage": 83.57, "elapsed_time": "1:52:29", "remaining_time": "0:22:07"}
|
535 |
+
{"current_steps": 535, "total_steps": 639, "loss": 0.4361, "lr": 7.85695027053241e-07, "epoch": 2.511737089201878, "percentage": 83.72, "elapsed_time": "1:52:42", "remaining_time": "0:21:54"}
|
536 |
+
{"current_steps": 536, "total_steps": 639, "loss": 0.4343, "lr": 7.710572233233082e-07, "epoch": 2.516431924882629, "percentage": 83.88, "elapsed_time": "1:52:54", "remaining_time": "0:21:41"}
|
537 |
+
{"current_steps": 537, "total_steps": 639, "loss": 0.4263, "lr": 7.565456589534137e-07, "epoch": 2.52112676056338, "percentage": 84.04, "elapsed_time": "1:53:07", "remaining_time": "0:21:29"}
|
538 |
+
{"current_steps": 538, "total_steps": 639, "loss": 0.4506, "lr": 7.421607671323461e-07, "epoch": 2.5258215962441315, "percentage": 84.19, "elapsed_time": "1:53:19", "remaining_time": "0:21:16"}
|
539 |
+
{"current_steps": 539, "total_steps": 639, "loss": 0.4366, "lr": 7.279029772675572e-07, "epoch": 2.5305164319248825, "percentage": 84.35, "elapsed_time": "1:53:35", "remaining_time": "0:21:04"}
|
540 |
+
{"current_steps": 540, "total_steps": 639, "loss": 0.4536, "lr": 7.137727149723417e-07, "epoch": 2.535211267605634, "percentage": 84.51, "elapsed_time": "1:53:47", "remaining_time": "0:20:51"}
|
541 |
+
{"current_steps": 541, "total_steps": 639, "loss": 0.4108, "lr": 6.997704020531321e-07, "epoch": 2.539906103286385, "percentage": 84.66, "elapsed_time": "1:53:57", "remaining_time": "0:20:38"}
|
542 |
+
{"current_steps": 542, "total_steps": 639, "loss": 0.4529, "lr": 6.858964564969089e-07, "epoch": 2.544600938967136, "percentage": 84.82, "elapsed_time": "1:54:09", "remaining_time": "0:20:25"}
|
543 |
+
{"current_steps": 543, "total_steps": 639, "loss": 0.4548, "lr": 6.721512924587243e-07, "epoch": 2.5492957746478875, "percentage": 84.98, "elapsed_time": "1:54:19", "remaining_time": "0:20:12"}
|
544 |
+
{"current_steps": 544, "total_steps": 639, "loss": 0.4333, "lr": 6.585353202493322e-07, "epoch": 2.5539906103286385, "percentage": 85.13, "elapsed_time": "1:54:37", "remaining_time": "0:20:01"}
|
545 |
+
{"current_steps": 545, "total_steps": 639, "loss": 0.4294, "lr": 6.450489463229493e-07, "epoch": 2.5586854460093895, "percentage": 85.29, "elapsed_time": "1:54:49", "remaining_time": "0:19:48"}
|
546 |
+
{"current_steps": 546, "total_steps": 639, "loss": 0.4281, "lr": 6.31692573265117e-07, "epoch": 2.563380281690141, "percentage": 85.45, "elapsed_time": "1:55:00", "remaining_time": "0:19:35"}
|
547 |
+
{"current_steps": 547, "total_steps": 639, "loss": 0.4418, "lr": 6.184665997806832e-07, "epoch": 2.568075117370892, "percentage": 85.6, "elapsed_time": "1:55:16", "remaining_time": "0:19:23"}
|
548 |
+
{"current_steps": 548, "total_steps": 639, "loss": 0.4189, "lr": 6.053714206818989e-07, "epoch": 2.572769953051643, "percentage": 85.76, "elapsed_time": "1:55:24", "remaining_time": "0:19:09"}
|
549 |
+
{"current_steps": 549, "total_steps": 639, "loss": 0.4143, "lr": 5.924074268766422e-07, "epoch": 2.5774647887323945, "percentage": 85.92, "elapsed_time": "1:55:36", "remaining_time": "0:18:57"}
|
550 |
+
{"current_steps": 550, "total_steps": 639, "loss": 0.4357, "lr": 5.79575005356735e-07, "epoch": 2.5821596244131455, "percentage": 86.07, "elapsed_time": "1:55:49", "remaining_time": "0:18:44"}
|
551 |
+
{"current_steps": 551, "total_steps": 639, "loss": 0.4203, "lr": 5.668745391864017e-07, "epoch": 2.586854460093897, "percentage": 86.23, "elapsed_time": "1:56:01", "remaining_time": "0:18:31"}
|
552 |
+
{"current_steps": 552, "total_steps": 639, "loss": 0.4242, "lr": 5.543064074908272e-07, "epoch": 2.591549295774648, "percentage": 86.38, "elapsed_time": "1:56:11", "remaining_time": "0:18:18"}
|
553 |
+
{"current_steps": 553, "total_steps": 639, "loss": 0.4491, "lr": 5.418709854448489e-07, "epoch": 2.596244131455399, "percentage": 86.54, "elapsed_time": "1:56:21", "remaining_time": "0:18:05"}
|
554 |
+
{"current_steps": 554, "total_steps": 639, "loss": 0.415, "lr": 5.295686442617442e-07, "epoch": 2.60093896713615, "percentage": 86.7, "elapsed_time": "1:56:35", "remaining_time": "0:17:53"}
|
555 |
+
{"current_steps": 555, "total_steps": 639, "loss": 0.441, "lr": 5.173997511821599e-07, "epoch": 2.6056338028169015, "percentage": 86.85, "elapsed_time": "1:56:47", "remaining_time": "0:17:40"}
|
556 |
+
{"current_steps": 556, "total_steps": 639, "loss": 0.4352, "lr": 5.053646694631459e-07, "epoch": 2.6103286384976525, "percentage": 87.01, "elapsed_time": "1:56:59", "remaining_time": "0:17:27"}
|
557 |
+
{"current_steps": 557, "total_steps": 639, "loss": 0.4348, "lr": 4.934637583673119e-07, "epoch": 2.615023474178404, "percentage": 87.17, "elapsed_time": "1:57:13", "remaining_time": "0:17:15"}
|
558 |
+
{"current_steps": 558, "total_steps": 639, "loss": 0.4687, "lr": 4.81697373152099e-07, "epoch": 2.619718309859155, "percentage": 87.32, "elapsed_time": "1:57:24", "remaining_time": "0:17:02"}
|
559 |
+
{"current_steps": 559, "total_steps": 639, "loss": 0.4372, "lr": 4.7006586505918273e-07, "epoch": 2.624413145539906, "percentage": 87.48, "elapsed_time": "1:57:41", "remaining_time": "0:16:50"}
|
560 |
+
{"current_steps": 560, "total_steps": 639, "loss": 0.454, "lr": 4.5856958130398146e-07, "epoch": 2.629107981220657, "percentage": 87.64, "elapsed_time": "1:57:55", "remaining_time": "0:16:38"}
|
561 |
+
{"current_steps": 561, "total_steps": 639, "loss": 0.4322, "lr": 4.472088650652956e-07, "epoch": 2.6338028169014085, "percentage": 87.79, "elapsed_time": "1:58:06", "remaining_time": "0:16:25"}
|
562 |
+
{"current_steps": 562, "total_steps": 639, "loss": 0.4285, "lr": 4.3598405547505886e-07, "epoch": 2.6384976525821595, "percentage": 87.95, "elapsed_time": "1:58:18", "remaining_time": "0:16:12"}
|
563 |
+
{"current_steps": 563, "total_steps": 639, "loss": 0.4502, "lr": 4.248954876082195e-07, "epoch": 2.643192488262911, "percentage": 88.11, "elapsed_time": "1:58:27", "remaining_time": "0:15:59"}
|
564 |
+
{"current_steps": 564, "total_steps": 639, "loss": 0.4368, "lr": 4.139434924727359e-07, "epoch": 2.647887323943662, "percentage": 88.26, "elapsed_time": "1:58:42", "remaining_time": "0:15:47"}
|
565 |
+
{"current_steps": 565, "total_steps": 639, "loss": 0.4492, "lr": 4.031283969996919e-07, "epoch": 2.652582159624413, "percentage": 88.42, "elapsed_time": "1:59:01", "remaining_time": "0:15:35"}
|
566 |
+
{"current_steps": 566, "total_steps": 639, "loss": 0.4581, "lr": 3.924505240335469e-07, "epoch": 2.6572769953051645, "percentage": 88.58, "elapsed_time": "1:59:11", "remaining_time": "0:15:22"}
|
567 |
+
{"current_steps": 567, "total_steps": 639, "loss": 0.4373, "lr": 3.819101923224877e-07, "epoch": 2.6619718309859155, "percentage": 88.73, "elapsed_time": "1:59:23", "remaining_time": "0:15:09"}
|
568 |
+
{"current_steps": 568, "total_steps": 639, "loss": 0.4371, "lr": 3.71507716508922e-07, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "1:59:35", "remaining_time": "0:14:56"}
|
569 |
+
{"current_steps": 569, "total_steps": 639, "loss": 0.4512, "lr": 3.612434071200771e-07, "epoch": 2.671361502347418, "percentage": 89.05, "elapsed_time": "1:59:50", "remaining_time": "0:14:44"}
|
570 |
+
{"current_steps": 570, "total_steps": 639, "loss": 0.4255, "lr": 3.511175705587433e-07, "epoch": 2.676056338028169, "percentage": 89.2, "elapsed_time": "2:00:05", "remaining_time": "0:14:32"}
|
571 |
+
{"current_steps": 571, "total_steps": 639, "loss": 0.401, "lr": 3.411305090941125e-07, "epoch": 2.68075117370892, "percentage": 89.36, "elapsed_time": "2:00:14", "remaining_time": "0:14:19"}
|
572 |
+
{"current_steps": 572, "total_steps": 639, "loss": 0.4547, "lr": 3.312825208527648e-07, "epoch": 2.6854460093896715, "percentage": 89.51, "elapsed_time": "2:00:28", "remaining_time": "0:14:06"}
|
573 |
+
{"current_steps": 573, "total_steps": 639, "loss": 0.431, "lr": 3.2157389980976783e-07, "epoch": 2.6901408450704225, "percentage": 89.67, "elapsed_time": "2:00:42", "remaining_time": "0:13:54"}
|
574 |
+
{"current_steps": 574, "total_steps": 639, "loss": 0.4217, "lr": 3.1200493577989875e-07, "epoch": 2.694835680751174, "percentage": 89.83, "elapsed_time": "2:00:56", "remaining_time": "0:13:41"}
|
575 |
+
{"current_steps": 575, "total_steps": 639, "loss": 0.4405, "lr": 3.0257591440899235e-07, "epoch": 2.699530516431925, "percentage": 89.98, "elapsed_time": "2:01:08", "remaining_time": "0:13:29"}
|
576 |
+
{"current_steps": 576, "total_steps": 639, "loss": 0.4137, "lr": 2.9328711716541725e-07, "epoch": 2.704225352112676, "percentage": 90.14, "elapsed_time": "2:01:17", "remaining_time": "0:13:15"}
|
577 |
+
{"current_steps": 577, "total_steps": 639, "loss": 0.4294, "lr": 2.841388213316726e-07, "epoch": 2.708920187793427, "percentage": 90.3, "elapsed_time": "2:01:28", "remaining_time": "0:13:03"}
|
578 |
+
{"current_steps": 578, "total_steps": 639, "loss": 0.4212, "lr": 2.751312999961103e-07, "epoch": 2.7136150234741785, "percentage": 90.45, "elapsed_time": "2:01:41", "remaining_time": "0:12:50"}
|
579 |
+
{"current_steps": 579, "total_steps": 639, "loss": 0.4298, "lr": 2.662648220447811e-07, "epoch": 2.7183098591549295, "percentage": 90.61, "elapsed_time": "2:01:55", "remaining_time": "0:12:38"}
|
580 |
+
{"current_steps": 580, "total_steps": 639, "loss": 0.4351, "lr": 2.5753965215341347e-07, "epoch": 2.723004694835681, "percentage": 90.77, "elapsed_time": "2:02:09", "remaining_time": "0:12:25"}
|
581 |
+
{"current_steps": 581, "total_steps": 639, "loss": 0.4404, "lr": 2.489560507795069e-07, "epoch": 2.727699530516432, "percentage": 90.92, "elapsed_time": "2:02:20", "remaining_time": "0:12:12"}
|
582 |
+
{"current_steps": 582, "total_steps": 639, "loss": 0.4344, "lr": 2.405142741545591e-07, "epoch": 2.732394366197183, "percentage": 91.08, "elapsed_time": "2:02:31", "remaining_time": "0:11:59"}
|
583 |
+
{"current_steps": 583, "total_steps": 639, "loss": 0.4234, "lr": 2.3221457427641815e-07, "epoch": 2.737089201877934, "percentage": 91.24, "elapsed_time": "2:02:42", "remaining_time": "0:11:47"}
|
584 |
+
{"current_steps": 584, "total_steps": 639, "loss": 0.4283, "lr": 2.240571989017598e-07, "epoch": 2.7417840375586855, "percentage": 91.39, "elapsed_time": "2:02:57", "remaining_time": "0:11:34"}
|
585 |
+
{"current_steps": 585, "total_steps": 639, "loss": 0.4428, "lr": 2.1604239153869e-07, "epoch": 2.7464788732394365, "percentage": 91.55, "elapsed_time": "2:03:10", "remaining_time": "0:11:22"}
|
586 |
+
{"current_steps": 586, "total_steps": 639, "loss": 0.4379, "lr": 2.0817039143947614e-07, "epoch": 2.751173708920188, "percentage": 91.71, "elapsed_time": "2:03:26", "remaining_time": "0:11:09"}
|
587 |
+
{"current_steps": 587, "total_steps": 639, "loss": 0.4394, "lr": 2.0044143359340852e-07, "epoch": 2.755868544600939, "percentage": 91.86, "elapsed_time": "2:03:40", "remaining_time": "0:10:57"}
|
588 |
+
{"current_steps": 588, "total_steps": 639, "loss": 0.4646, "lr": 1.928557487197802e-07, "epoch": 2.76056338028169, "percentage": 92.02, "elapsed_time": "2:03:54", "remaining_time": "0:10:44"}
|
589 |
+
{"current_steps": 589, "total_steps": 639, "loss": 0.4233, "lr": 1.8541356326100436e-07, "epoch": 2.7652582159624415, "percentage": 92.18, "elapsed_time": "2:04:08", "remaining_time": "0:10:32"}
|
590 |
+
{"current_steps": 590, "total_steps": 639, "loss": 0.4748, "lr": 1.7811509937584958e-07, "epoch": 2.7699530516431925, "percentage": 92.33, "elapsed_time": "2:04:25", "remaining_time": "0:10:19"}
|
591 |
+
{"current_steps": 591, "total_steps": 639, "loss": 0.4682, "lr": 1.7096057493281693e-07, "epoch": 2.7746478873239435, "percentage": 92.49, "elapsed_time": "2:04:36", "remaining_time": "0:10:07"}
|
592 |
+
{"current_steps": 592, "total_steps": 639, "loss": 0.4278, "lr": 1.6395020350362557e-07, "epoch": 2.779342723004695, "percentage": 92.64, "elapsed_time": "2:04:50", "remaining_time": "0:09:54"}
|
593 |
+
{"current_steps": 593, "total_steps": 639, "loss": 0.4184, "lr": 1.5708419435684463e-07, "epoch": 2.784037558685446, "percentage": 92.8, "elapsed_time": "2:05:02", "remaining_time": "0:09:41"}
|
594 |
+
{"current_steps": 594, "total_steps": 639, "loss": 0.4181, "lr": 1.5036275245164377e-07, "epoch": 2.788732394366197, "percentage": 92.96, "elapsed_time": "2:05:14", "remaining_time": "0:09:29"}
|
595 |
+
{"current_steps": 595, "total_steps": 639, "loss": 0.4044, "lr": 1.4378607843167635e-07, "epoch": 2.7934272300469485, "percentage": 93.11, "elapsed_time": "2:05:22", "remaining_time": "0:09:16"}
|
596 |
+
{"current_steps": 596, "total_steps": 639, "loss": 0.4191, "lr": 1.3735436861908702e-07, "epoch": 2.7981220657276995, "percentage": 93.27, "elapsed_time": "2:05:32", "remaining_time": "0:09:03"}
|
597 |
+
{"current_steps": 597, "total_steps": 639, "loss": 0.4315, "lr": 1.3106781500865417e-07, "epoch": 2.802816901408451, "percentage": 93.43, "elapsed_time": "2:05:42", "remaining_time": "0:08:50"}
|
598 |
+
{"current_steps": 598, "total_steps": 639, "loss": 0.4255, "lr": 1.249266052620579e-07, "epoch": 2.807511737089202, "percentage": 93.58, "elapsed_time": "2:05:58", "remaining_time": "0:08:38"}
|
599 |
+
{"current_steps": 599, "total_steps": 639, "loss": 0.431, "lr": 1.1893092270227724e-07, "epoch": 2.812206572769953, "percentage": 93.74, "elapsed_time": "2:06:12", "remaining_time": "0:08:25"}
|
600 |
+
{"current_steps": 600, "total_steps": 639, "loss": 0.4231, "lr": 1.1308094630811784e-07, "epoch": 2.816901408450704, "percentage": 93.9, "elapsed_time": "2:06:23", "remaining_time": "0:08:12"}
|
601 |
+
{"current_steps": 601, "total_steps": 639, "loss": 0.4345, "lr": 1.0737685070887016e-07, "epoch": 2.8215962441314555, "percentage": 94.05, "elapsed_time": "2:06:34", "remaining_time": "0:08:00"}
|
602 |
+
{"current_steps": 602, "total_steps": 639, "loss": 0.4132, "lr": 1.0181880617909701e-07, "epoch": 2.8262910798122065, "percentage": 94.21, "elapsed_time": "2:06:45", "remaining_time": "0:07:47"}
|
603 |
+
{"current_steps": 603, "total_steps": 639, "loss": 0.4231, "lr": 9.640697863354697e-08, "epoch": 2.830985915492958, "percentage": 94.37, "elapsed_time": "2:06:59", "remaining_time": "0:07:34"}
|
604 |
+
{"current_steps": 604, "total_steps": 639, "loss": 0.4228, "lr": 9.114152962220734e-08, "epoch": 2.835680751173709, "percentage": 94.52, "elapsed_time": "2:07:11", "remaining_time": "0:07:22"}
|
605 |
+
{"current_steps": 605, "total_steps": 639, "loss": 0.4299, "lr": 8.602261632547626e-08, "epoch": 2.84037558685446, "percentage": 94.68, "elapsed_time": "2:07:20", "remaining_time": "0:07:09"}
|
606 |
+
{"current_steps": 606, "total_steps": 639, "loss": 0.4384, "lr": 8.10503915494748e-08, "epoch": 2.845070422535211, "percentage": 94.84, "elapsed_time": "2:07:31", "remaining_time": "0:06:56"}
|
607 |
+
{"current_steps": 607, "total_steps": 639, "loss": 0.4364, "lr": 7.622500372148179e-08, "epoch": 2.8497652582159625, "percentage": 94.99, "elapsed_time": "2:07:43", "remaining_time": "0:06:43"}
|
608 |
+
{"current_steps": 608, "total_steps": 639, "loss": 0.4413, "lr": 7.15465968855078e-08, "epoch": 2.8544600938967135, "percentage": 95.15, "elapsed_time": "2:07:56", "remaining_time": "0:06:31"}
|
609 |
+
{"current_steps": 609, "total_steps": 639, "loss": 0.4492, "lr": 6.701531069799039e-08, "epoch": 2.859154929577465, "percentage": 95.31, "elapsed_time": "2:08:13", "remaining_time": "0:06:18"}
|
610 |
+
{"current_steps": 610, "total_steps": 639, "loss": 0.4424, "lr": 6.263128042362676e-08, "epoch": 2.863849765258216, "percentage": 95.46, "elapsed_time": "2:08:25", "remaining_time": "0:06:06"}
|
611 |
+
{"current_steps": 611, "total_steps": 639, "loss": 0.4239, "lr": 5.839463693133873e-08, "epoch": 2.868544600938967, "percentage": 95.62, "elapsed_time": "2:08:36", "remaining_time": "0:05:53"}
|
612 |
+
{"current_steps": 612, "total_steps": 639, "loss": 0.4438, "lr": 5.4305506690362495e-08, "epoch": 2.873239436619718, "percentage": 95.77, "elapsed_time": "2:08:46", "remaining_time": "0:05:40"}
|
613 |
+
{"current_steps": 613, "total_steps": 639, "loss": 0.4412, "lr": 5.036401176647332e-08, "epoch": 2.8779342723004695, "percentage": 95.93, "elapsed_time": "2:09:02", "remaining_time": "0:05:28"}
|
614 |
+
{"current_steps": 614, "total_steps": 639, "loss": 0.4302, "lr": 4.657026981834623e-08, "epoch": 2.8826291079812205, "percentage": 96.09, "elapsed_time": "2:09:14", "remaining_time": "0:05:15"}
|
615 |
+
{"current_steps": 615, "total_steps": 639, "loss": 0.4434, "lr": 4.292439409403826e-08, "epoch": 2.887323943661972, "percentage": 96.24, "elapsed_time": "2:09:25", "remaining_time": "0:05:03"}
|
616 |
+
{"current_steps": 616, "total_steps": 639, "loss": 0.463, "lr": 3.9426493427611177e-08, "epoch": 2.892018779342723, "percentage": 96.4, "elapsed_time": "2:09:36", "remaining_time": "0:04:50"}
|
617 |
+
{"current_steps": 617, "total_steps": 639, "loss": 0.4276, "lr": 3.6076672235880737e-08, "epoch": 2.896713615023474, "percentage": 96.56, "elapsed_time": "2:09:46", "remaining_time": "0:04:37"}
|
618 |
+
{"current_steps": 618, "total_steps": 639, "loss": 0.4171, "lr": 3.287503051530194e-08, "epoch": 2.9014084507042255, "percentage": 96.71, "elapsed_time": "2:10:03", "remaining_time": "0:04:25"}
|
619 |
+
{"current_steps": 619, "total_steps": 639, "loss": 0.4061, "lr": 2.9821663838981994e-08, "epoch": 2.9061032863849765, "percentage": 96.87, "elapsed_time": "2:10:15", "remaining_time": "0:04:12"}
|
620 |
+
{"current_steps": 620, "total_steps": 639, "loss": 0.4338, "lr": 2.6916663353828142e-08, "epoch": 2.910798122065728, "percentage": 97.03, "elapsed_time": "2:10:28", "remaining_time": "0:03:59"}
|
621 |
+
{"current_steps": 621, "total_steps": 639, "loss": 0.415, "lr": 2.416011577782651e-08, "epoch": 2.915492957746479, "percentage": 97.18, "elapsed_time": "2:10:39", "remaining_time": "0:03:47"}
|
622 |
+
{"current_steps": 622, "total_steps": 639, "loss": 0.442, "lr": 2.1552103397454725e-08, "epoch": 2.92018779342723, "percentage": 97.34, "elapsed_time": "2:10:56", "remaining_time": "0:03:34"}
|
623 |
+
{"current_steps": 623, "total_steps": 639, "loss": 0.4371, "lr": 1.909270406522279e-08, "epoch": 2.924882629107981, "percentage": 97.5, "elapsed_time": "2:11:13", "remaining_time": "0:03:22"}
|
624 |
+
{"current_steps": 624, "total_steps": 639, "loss": 0.4063, "lr": 1.6781991197352133e-08, "epoch": 2.9295774647887325, "percentage": 97.65, "elapsed_time": "2:11:24", "remaining_time": "0:03:09"}
|
625 |
+
{"current_steps": 625, "total_steps": 639, "loss": 0.4113, "lr": 1.4620033771582942e-08, "epoch": 2.9342723004694835, "percentage": 97.81, "elapsed_time": "2:11:33", "remaining_time": "0:02:56"}
|
626 |
+
{"current_steps": 626, "total_steps": 639, "loss": 0.4048, "lr": 1.2606896325113582e-08, "epoch": 2.938967136150235, "percentage": 97.97, "elapsed_time": "2:11:42", "remaining_time": "0:02:44"}
|
627 |
+
{"current_steps": 627, "total_steps": 639, "loss": 0.4571, "lr": 1.0742638952676577e-08, "epoch": 2.943661971830986, "percentage": 98.12, "elapsed_time": "2:11:52", "remaining_time": "0:02:31"}
|
628 |
+
{"current_steps": 628, "total_steps": 639, "loss": 0.4387, "lr": 9.027317304742267e-09, "epoch": 2.948356807511737, "percentage": 98.28, "elapsed_time": "2:12:07", "remaining_time": "0:02:18"}
|
629 |
+
{"current_steps": 629, "total_steps": 639, "loss": 0.4065, "lr": 7.460982585860144e-09, "epoch": 2.953051643192488, "percentage": 98.44, "elapsed_time": "2:12:21", "remaining_time": "0:02:06"}
|
630 |
+
{"current_steps": 630, "total_steps": 639, "loss": 0.4382, "lr": 6.0436815531284e-09, "epoch": 2.9577464788732395, "percentage": 98.59, "elapsed_time": "2:12:32", "remaining_time": "0:01:53"}
|
631 |
+
{"current_steps": 631, "total_steps": 639, "loss": 0.4521, "lr": 4.7754565147983824e-09, "epoch": 2.9624413145539905, "percentage": 98.75, "elapsed_time": "2:12:41", "remaining_time": "0:01:40"}
|
632 |
+
{"current_steps": 632, "total_steps": 639, "loss": 0.4514, "lr": 3.6563453290122675e-09, "epoch": 2.967136150234742, "percentage": 98.9, "elapsed_time": "2:12:52", "remaining_time": "0:01:28"}
|
633 |
+
{"current_steps": 633, "total_steps": 639, "loss": 0.4344, "lr": 2.68638140267341e-09, "epoch": 2.971830985915493, "percentage": 99.06, "elapsed_time": "2:13:08", "remaining_time": "0:01:15"}
|
634 |
+
{"current_steps": 634, "total_steps": 639, "loss": 0.4214, "lr": 1.865593690446588e-09, "epoch": 2.976525821596244, "percentage": 99.22, "elapsed_time": "2:13:20", "remaining_time": "0:01:03"}
|
635 |
+
{"current_steps": 635, "total_steps": 639, "loss": 0.4458, "lr": 1.1940066938981309e-09, "epoch": 2.981220657276995, "percentage": 99.37, "elapsed_time": "2:13:29", "remaining_time": "0:00:50"}
|
636 |
+
{"current_steps": 636, "total_steps": 639, "loss": 0.4048, "lr": 6.71640460759293e-10, "epoch": 2.9859154929577465, "percentage": 99.53, "elapsed_time": "2:13:38", "remaining_time": "0:00:37"}
|
637 |
+
{"current_steps": 637, "total_steps": 639, "loss": 0.4044, "lr": 2.9851058433116865e-10, "epoch": 2.9906103286384975, "percentage": 99.69, "elapsed_time": "2:13:51", "remaining_time": "0:00:25"}
|
638 |
+
{"current_steps": 638, "total_steps": 639, "loss": 0.4259, "lr": 7.462820301951113e-11, "epoch": 2.995305164319249, "percentage": 99.84, "elapsed_time": "2:14:06", "remaining_time": "0:00:12"}
|
639 |
+
{"current_steps": 639, "total_steps": 639, "loss": 0.4053, "lr": 0.0, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:14:19", "remaining_time": "0:00:00"}
|
640 |
+
{"current_steps": 639, "total_steps": 639, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:15:50", "remaining_time": "0:00:00"}
|