Training in progress, step 459
Browse files
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986211280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9789b03be10afb07471a4b74796a5001da46752c47c4d2235258f177016a43ec
|
3 |
size 4986211280
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26732334a0c5893ab3faa0ea1c0e4d7a637b076d9b332bbdcd4dc3b00919dbc2
|
3 |
size 4954847344
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b73376a731dc58b7cde2d0ab810bb5e27219f2afeea36f4117915bbb57832e3
|
3 |
size 4954847392
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a4c78924a2e564c9d5b4c6310ea13d00141f082cbc4255854ccbfd818cc2176
|
3 |
size 4954847392
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbeb70a36dbeaf6d65a0d25641b07ec99072d58e1e5951a62119f31eff2cc04c
|
3 |
size 4954847392
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4734533160
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86ac5ec08886255eed3335af99a806a203766117eee17cc3a335a907e8a42106
|
3 |
size 4734533160
|
trainer_log.jsonl
CHANGED
@@ -401,3 +401,60 @@
|
|
401 |
{"current_steps": 401, "total_steps": 459, "loss": 0.0842, "lr": 4.951556604879049e-07, "epoch": 2.6071817192600655, "percentage": 87.36, "elapsed_time": "7:45:40", "remaining_time": "1:07:21"}
|
402 |
{"current_steps": 402, "total_steps": 459, "loss": 0.1044, "lr": 4.787838990956228e-07, "epoch": 2.6137105549510338, "percentage": 87.58, "elapsed_time": "7:46:55", "remaining_time": "1:06:12"}
|
403 |
{"current_steps": 403, "total_steps": 459, "loss": 0.0838, "lr": 4.62673746783317e-07, "epoch": 2.620239390642002, "percentage": 87.8, "elapsed_time": "7:47:54", "remaining_time": "1:05:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
401 |
{"current_steps": 401, "total_steps": 459, "loss": 0.0842, "lr": 4.951556604879049e-07, "epoch": 2.6071817192600655, "percentage": 87.36, "elapsed_time": "7:45:40", "remaining_time": "1:07:21"}
|
402 |
{"current_steps": 402, "total_steps": 459, "loss": 0.1044, "lr": 4.787838990956228e-07, "epoch": 2.6137105549510338, "percentage": 87.58, "elapsed_time": "7:46:55", "remaining_time": "1:06:12"}
|
403 |
{"current_steps": 403, "total_steps": 459, "loss": 0.0838, "lr": 4.62673746783317e-07, "epoch": 2.620239390642002, "percentage": 87.8, "elapsed_time": "7:47:54", "remaining_time": "1:05:01"}
|
404 |
+
{"current_steps": 404, "total_steps": 459, "loss": 0.0997, "lr": 4.468261357254339e-07, "epoch": 2.6267682263329704, "percentage": 88.02, "elapsed_time": "7:49:04", "remaining_time": "1:03:51"}
|
405 |
+
{"current_steps": 405, "total_steps": 459, "loss": 0.0896, "lr": 4.312419829051173e-07, "epoch": 2.633297062023939, "percentage": 88.24, "elapsed_time": "7:50:11", "remaining_time": "1:02:41"}
|
406 |
+
{"current_steps": 406, "total_steps": 459, "loss": 0.079, "lr": 4.1592219006114597e-07, "epoch": 2.6398258977149074, "percentage": 88.45, "elapsed_time": "7:51:15", "remaining_time": "1:01:31"}
|
407 |
+
{"current_steps": 407, "total_steps": 459, "loss": 0.1053, "lr": 4.008676436357539e-07, "epoch": 2.646354733405876, "percentage": 88.67, "elapsed_time": "7:52:21", "remaining_time": "1:00:20"}
|
408 |
+
{"current_steps": 408, "total_steps": 459, "loss": 0.0861, "lr": 3.86079214723345e-07, "epoch": 2.6528835690968444, "percentage": 88.89, "elapsed_time": "7:53:30", "remaining_time": "0:59:11"}
|
409 |
+
{"current_steps": 409, "total_steps": 459, "loss": 0.0892, "lr": 3.7155775902008527e-07, "epoch": 2.6594124047878127, "percentage": 89.11, "elapsed_time": "7:54:50", "remaining_time": "0:58:03"}
|
410 |
+
{"current_steps": 410, "total_steps": 459, "loss": 0.0988, "lr": 3.5730411677439125e-07, "epoch": 2.6659412404787814, "percentage": 89.32, "elapsed_time": "7:56:10", "remaining_time": "0:56:54"}
|
411 |
+
{"current_steps": 411, "total_steps": 459, "loss": 0.0954, "lr": 3.433191127383079e-07, "epoch": 2.6724700761697497, "percentage": 89.54, "elapsed_time": "7:57:30", "remaining_time": "0:55:46"}
|
412 |
+
{"current_steps": 412, "total_steps": 459, "loss": 0.089, "lr": 3.2960355611979245e-07, "epoch": 2.678998911860718, "percentage": 89.76, "elapsed_time": "7:58:39", "remaining_time": "0:54:36"}
|
413 |
+
{"current_steps": 413, "total_steps": 459, "loss": 0.1022, "lr": 3.1615824053588764e-07, "epoch": 2.6855277475516868, "percentage": 89.98, "elapsed_time": "7:59:33", "remaining_time": "0:53:24"}
|
414 |
+
{"current_steps": 414, "total_steps": 459, "loss": 0.0891, "lr": 3.029839439668003e-07, "epoch": 2.692056583242655, "percentage": 90.2, "elapsed_time": "8:00:32", "remaining_time": "0:52:13"}
|
415 |
+
{"current_steps": 415, "total_steps": 459, "loss": 0.0902, "lr": 2.9008142871088665e-07, "epoch": 2.6985854189336234, "percentage": 90.41, "elapsed_time": "8:01:34", "remaining_time": "0:51:03"}
|
416 |
+
{"current_steps": 416, "total_steps": 459, "loss": 0.0914, "lr": 2.774514413405444e-07, "epoch": 2.705114254624592, "percentage": 90.63, "elapsed_time": "8:02:52", "remaining_time": "0:49:54"}
|
417 |
+
{"current_steps": 417, "total_steps": 459, "loss": 0.0857, "lr": 2.6509471265901476e-07, "epoch": 2.7116430903155604, "percentage": 90.85, "elapsed_time": "8:04:04", "remaining_time": "0:48:45"}
|
418 |
+
{"current_steps": 418, "total_steps": 459, "loss": 0.0835, "lr": 2.530119576580936e-07, "epoch": 2.7181719260065287, "percentage": 91.07, "elapsed_time": "8:05:25", "remaining_time": "0:47:36"}
|
419 |
+
{"current_steps": 419, "total_steps": 459, "loss": 0.0886, "lr": 2.412038754767626e-07, "epoch": 2.7247007616974974, "percentage": 91.29, "elapsed_time": "8:06:24", "remaining_time": "0:46:26"}
|
420 |
+
{"current_steps": 420, "total_steps": 459, "loss": 0.1014, "lr": 2.2967114936073342e-07, "epoch": 2.7312295973884657, "percentage": 91.5, "elapsed_time": "8:07:26", "remaining_time": "0:45:15"}
|
421 |
+
{"current_steps": 421, "total_steps": 459, "loss": 0.0848, "lr": 2.1841444662291543e-07, "epoch": 2.737758433079434, "percentage": 91.72, "elapsed_time": "8:08:25", "remaining_time": "0:44:05"}
|
422 |
+
{"current_steps": 422, "total_steps": 459, "loss": 0.0874, "lr": 2.0743441860480218e-07, "epoch": 2.7442872687704027, "percentage": 91.94, "elapsed_time": "8:09:34", "remaining_time": "0:42:55"}
|
423 |
+
{"current_steps": 423, "total_steps": 459, "loss": 0.0971, "lr": 1.967317006387831e-07, "epoch": 2.750816104461371, "percentage": 92.16, "elapsed_time": "8:10:31", "remaining_time": "0:41:44"}
|
424 |
+
{"current_steps": 424, "total_steps": 459, "loss": 0.0849, "lr": 1.863069120113814e-07, "epoch": 2.7573449401523398, "percentage": 92.37, "elapsed_time": "8:11:36", "remaining_time": "0:40:34"}
|
425 |
+
{"current_steps": 425, "total_steps": 459, "loss": 0.0869, "lr": 1.7616065592742038e-07, "epoch": 2.763873775843308, "percentage": 92.59, "elapsed_time": "8:12:54", "remaining_time": "0:39:25"}
|
426 |
+
{"current_steps": 426, "total_steps": 459, "loss": 0.0775, "lr": 1.6629351947512195e-07, "epoch": 2.7704026115342764, "percentage": 92.81, "elapsed_time": "8:13:50", "remaining_time": "0:38:15"}
|
427 |
+
{"current_steps": 427, "total_steps": 459, "loss": 0.0801, "lr": 1.5670607359213442e-07, "epoch": 2.7769314472252447, "percentage": 93.03, "elapsed_time": "8:15:02", "remaining_time": "0:37:05"}
|
428 |
+
{"current_steps": 428, "total_steps": 459, "loss": 0.0801, "lr": 1.4739887303249877e-07, "epoch": 2.7834602829162134, "percentage": 93.25, "elapsed_time": "8:15:59", "remaining_time": "0:35:55"}
|
429 |
+
{"current_steps": 429, "total_steps": 459, "loss": 0.0795, "lr": 1.3837245633454512e-07, "epoch": 2.7899891186071817, "percentage": 93.46, "elapsed_time": "8:16:59", "remaining_time": "0:34:45"}
|
430 |
+
{"current_steps": 430, "total_steps": 459, "loss": 0.076, "lr": 1.2962734578973568e-07, "epoch": 2.7965179542981504, "percentage": 93.68, "elapsed_time": "8:17:57", "remaining_time": "0:33:35"}
|
431 |
+
{"current_steps": 431, "total_steps": 459, "loss": 0.0898, "lr": 1.2116404741244204e-07, "epoch": 2.8030467899891187, "percentage": 93.9, "elapsed_time": "8:19:08", "remaining_time": "0:32:25"}
|
432 |
+
{"current_steps": 432, "total_steps": 459, "loss": 0.0848, "lr": 1.1298305091066664e-07, "epoch": 2.809575625680087, "percentage": 94.12, "elapsed_time": "8:20:19", "remaining_time": "0:31:16"}
|
433 |
+
{"current_steps": 433, "total_steps": 459, "loss": 0.0849, "lr": 1.0508482965770506e-07, "epoch": 2.8161044613710553, "percentage": 94.34, "elapsed_time": "8:21:46", "remaining_time": "0:30:07"}
|
434 |
+
{"current_steps": 434, "total_steps": 459, "loss": 0.0793, "lr": 9.746984066475728e-08, "epoch": 2.822633297062024, "percentage": 94.55, "elapsed_time": "8:23:01", "remaining_time": "0:28:58"}
|
435 |
+
{"current_steps": 435, "total_steps": 459, "loss": 0.088, "lr": 9.013852455448335e-08, "epoch": 2.8291621327529923, "percentage": 94.77, "elapsed_time": "8:23:59", "remaining_time": "0:27:48"}
|
436 |
+
{"current_steps": 436, "total_steps": 459, "loss": 0.0994, "lr": 8.309130553550815e-08, "epoch": 2.835690968443961, "percentage": 94.99, "elapsed_time": "8:25:02", "remaining_time": "0:26:38"}
|
437 |
+
{"current_steps": 437, "total_steps": 459, "loss": 0.0919, "lr": 7.632859137787329e-08, "epoch": 2.8422198041349294, "percentage": 95.21, "elapsed_time": "8:26:05", "remaining_time": "0:25:28"}
|
438 |
+
{"current_steps": 438, "total_steps": 459, "loss": 0.0878, "lr": 6.985077338944656e-08, "epoch": 2.8487486398258977, "percentage": 95.42, "elapsed_time": "8:27:04", "remaining_time": "0:24:18"}
|
439 |
+
{"current_steps": 439, "total_steps": 459, "loss": 0.0918, "lr": 6.365822639327724e-08, "epoch": 2.855277475516866, "percentage": 95.64, "elapsed_time": "8:28:16", "remaining_time": "0:23:09"}
|
440 |
+
{"current_steps": 440, "total_steps": 459, "loss": 0.0693, "lr": 5.775130870590784e-08, "epoch": 2.8618063112078347, "percentage": 95.86, "elapsed_time": "8:29:23", "remaining_time": "0:21:59"}
|
441 |
+
{"current_steps": 441, "total_steps": 459, "loss": 0.0873, "lr": 5.213036211664191e-08, "epoch": 2.868335146898803, "percentage": 96.08, "elapsed_time": "8:30:28", "remaining_time": "0:20:50"}
|
442 |
+
{"current_steps": 442, "total_steps": 459, "loss": 0.0957, "lr": 4.6795711867766436e-08, "epoch": 2.8748639825897717, "percentage": 96.3, "elapsed_time": "8:31:22", "remaining_time": "0:19:40"}
|
443 |
+
{"current_steps": 443, "total_steps": 459, "loss": 0.0954, "lr": 4.1747666635733594e-08, "epoch": 2.88139281828074, "percentage": 96.51, "elapsed_time": "8:32:21", "remaining_time": "0:18:30"}
|
444 |
+
{"current_steps": 444, "total_steps": 459, "loss": 0.0704, "lr": 3.698651851329838e-08, "epoch": 2.8879216539717083, "percentage": 96.73, "elapsed_time": "8:33:41", "remaining_time": "0:17:21"}
|
445 |
+
{"current_steps": 445, "total_steps": 459, "loss": 0.0777, "lr": 3.251254299261875e-08, "epoch": 2.8944504896626766, "percentage": 96.95, "elapsed_time": "8:34:49", "remaining_time": "0:16:11"}
|
446 |
+
{"current_steps": 446, "total_steps": 459, "loss": 0.088, "lr": 2.8325998949314536e-08, "epoch": 2.9009793253536453, "percentage": 97.17, "elapsed_time": "8:36:01", "remaining_time": "0:15:02"}
|
447 |
+
{"current_steps": 447, "total_steps": 459, "loss": 0.0781, "lr": 2.442712862748775e-08, "epoch": 2.9075081610446136, "percentage": 97.39, "elapsed_time": "8:37:16", "remaining_time": "0:13:53"}
|
448 |
+
{"current_steps": 448, "total_steps": 459, "loss": 0.0937, "lr": 2.0816157625706547e-08, "epoch": 2.9140369967355824, "percentage": 97.6, "elapsed_time": "8:37:58", "remaining_time": "0:12:43"}
|
449 |
+
{"current_steps": 449, "total_steps": 459, "loss": 0.1076, "lr": 1.749329488395124e-08, "epoch": 2.9205658324265507, "percentage": 97.82, "elapsed_time": "8:38:52", "remaining_time": "0:11:33"}
|
450 |
+
{"current_steps": 450, "total_steps": 459, "loss": 0.0781, "lr": 1.4458732671523978e-08, "epoch": 2.927094668117519, "percentage": 98.04, "elapsed_time": "8:40:01", "remaining_time": "0:10:24"}
|
451 |
+
{"current_steps": 451, "total_steps": 459, "loss": 0.0824, "lr": 1.1712646575922637e-08, "epoch": 2.9336235038084872, "percentage": 98.26, "elapsed_time": "8:41:14", "remaining_time": "0:09:14"}
|
452 |
+
{"current_steps": 452, "total_steps": 459, "loss": 0.0864, "lr": 9.25519549268561e-09, "epoch": 2.940152339499456, "percentage": 98.47, "elapsed_time": "8:42:11", "remaining_time": "0:08:05"}
|
453 |
+
{"current_steps": 453, "total_steps": 459, "loss": 0.0966, "lr": 7.0865216161902785e-09, "epoch": 2.9466811751904243, "percentage": 98.69, "elapsed_time": "8:43:22", "remaining_time": "0:06:55"}
|
454 |
+
{"current_steps": 454, "total_steps": 459, "loss": 0.074, "lr": 5.2067504314323725e-09, "epoch": 2.953210010881393, "percentage": 98.91, "elapsed_time": "8:44:36", "remaining_time": "0:05:46"}
|
455 |
+
{"current_steps": 455, "total_steps": 459, "loss": 0.0893, "lr": 3.6159907067601086e-09, "epoch": 2.9597388465723613, "percentage": 99.13, "elapsed_time": "8:45:41", "remaining_time": "0:04:37"}
|
456 |
+
{"current_steps": 456, "total_steps": 459, "loss": 0.0993, "lr": 2.314334487583114e-09, "epoch": 2.9662676822633296, "percentage": 99.35, "elapsed_time": "8:46:47", "remaining_time": "0:03:27"}
|
457 |
+
{"current_steps": 457, "total_steps": 459, "loss": 0.0763, "lr": 1.3018570910466876e-09, "epoch": 2.972796517954298, "percentage": 99.56, "elapsed_time": "8:47:59", "remaining_time": "0:02:18"}
|
458 |
+
{"current_steps": 458, "total_steps": 459, "loss": 0.0899, "lr": 5.78617101670842e-10, "epoch": 2.9793253536452666, "percentage": 99.78, "elapsed_time": "8:49:04", "remaining_time": "0:01:09"}
|
459 |
+
{"current_steps": 459, "total_steps": 459, "loss": 0.0834, "lr": 1.4465636796412442e-10, "epoch": 2.985854189336235, "percentage": 100.0, "elapsed_time": "8:50:14", "remaining_time": "0:00:00"}
|
460 |
+
{"current_steps": 459, "total_steps": 459, "epoch": 2.985854189336235, "percentage": 100.0, "elapsed_time": "8:54:12", "remaining_time": "0:00:00"}
|