Training in progress, step 426
Browse files- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +24 -0
model-00001-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4891730992
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43b40c525792ad3e6de5589b17eaff211e15b401bd0d5e92b320e065a6ea74ec
|
3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c372762ea93be26175d7d35ea249d253fb286a52bbd5b0dd566edcf49cd389e
|
3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059384
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b939e2451796009d72707e8e83f80eae06ce48ff2e7e9424872e380ad17d4a8
|
3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e148ca37108944eca7118b85d268a60c169eb890c5e2f1267bacd98a1d00724c
|
3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87225c1e4ddadd76ef0da03a351f54eaf3fade47d1e4887379a8e0110d257dcc
|
3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31cb3d659d727a91cb661042610b3212af83e1c186b6a8d1a9b5f7c058c1f576
|
3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fafbc1cc3b179ee4394d528e6c8565324df990c766c4c59e4a0567b837f48840
|
3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:394130d1b9a6e83e6385a7f75db89a98dff617a05817515a7328366722aaa9bc
|
3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5059985f7ab222e7541286dbad063e738ad81790a0f8ced9475ba37dcc4430b5
|
3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6eb7a69b99b57eeeb4c561f410f6790b5b4dc7231219438b33063b1c0144aa18
|
3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbaf0084a117d434669b8ef0acd70c439c7086367d6f0c33618c220649178faa
|
3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1be3d2bb093a5655e75c89047659f04f9a388c1cc3bb5389bebd2a0f3df6aec
|
3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66dbfa165fec0bea19e0bd610bbf54808bc715039aeb4c782061f6294586cfc0
|
3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2123397800
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7139404dd7facea1e774d18faa69171e0791a9c49f57abaa95eddf890f08b881
|
3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
@@ -401,3 +401,27 @@
|
|
401 |
{"current_steps": 401, "total_steps": 426, "loss": 0.2217, "lr": 1.0476103796312254e-07, "epoch": 2.807962529274005, "percentage": 94.13, "elapsed_time": "15:04:34", "remaining_time": "0:56:23"}
|
402 |
{"current_steps": 402, "total_steps": 426, "loss": 0.2113, "lr": 9.657431935277629e-08, "epoch": 2.8149882903981265, "percentage": 94.37, "elapsed_time": "15:06:43", "remaining_time": "0:54:07"}
|
403 |
{"current_steps": 403, "total_steps": 426, "loss": 0.2032, "lr": 8.871751368978554e-08, "epoch": 2.822014051522248, "percentage": 94.6, "elapsed_time": "15:08:50", "remaining_time": "0:51:52"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
401 |
{"current_steps": 401, "total_steps": 426, "loss": 0.2217, "lr": 1.0476103796312254e-07, "epoch": 2.807962529274005, "percentage": 94.13, "elapsed_time": "15:04:34", "remaining_time": "0:56:23"}
|
402 |
{"current_steps": 402, "total_steps": 426, "loss": 0.2113, "lr": 9.657431935277629e-08, "epoch": 2.8149882903981265, "percentage": 94.37, "elapsed_time": "15:06:43", "remaining_time": "0:54:07"}
|
403 |
{"current_steps": 403, "total_steps": 426, "loss": 0.2032, "lr": 8.871751368978554e-08, "epoch": 2.822014051522248, "percentage": 94.6, "elapsed_time": "15:08:50", "remaining_time": "0:51:52"}
|
404 |
+
{"current_steps": 404, "total_steps": 426, "loss": 0.19, "lr": 8.119114959680929e-08, "epoch": 2.82903981264637, "percentage": 94.84, "elapsed_time": "15:11:01", "remaining_time": "0:49:36"}
|
405 |
+
{"current_steps": 405, "total_steps": 426, "loss": 0.2377, "lr": 7.399573346368871e-08, "epoch": 2.836065573770492, "percentage": 95.07, "elapsed_time": "15:13:07", "remaining_time": "0:47:20"}
|
406 |
+
{"current_steps": 406, "total_steps": 426, "loss": 0.2307, "lr": 6.713174941338163e-08, "epoch": 2.8430913348946136, "percentage": 95.31, "elapsed_time": "15:15:12", "remaining_time": "0:45:05"}
|
407 |
+
{"current_steps": 407, "total_steps": 426, "loss": 0.1509, "lr": 6.05996592693886e-08, "epoch": 2.850117096018735, "percentage": 95.54, "elapsed_time": "15:18:17", "remaining_time": "0:42:52"}
|
408 |
+
{"current_steps": 408, "total_steps": 426, "loss": 0.2429, "lr": 5.439990252467886e-08, "epoch": 2.857142857142857, "percentage": 95.77, "elapsed_time": "15:22:04", "remaining_time": "0:40:40"}
|
409 |
+
{"current_steps": 409, "total_steps": 426, "loss": 0.2302, "lr": 4.853289631212066e-08, "epoch": 2.8641686182669788, "percentage": 96.01, "elapsed_time": "15:26:35", "remaining_time": "0:38:30"}
|
410 |
+
{"current_steps": 410, "total_steps": 426, "loss": 0.1985, "lr": 4.299903537641703e-08, "epoch": 2.871194379391101, "percentage": 96.24, "elapsed_time": "15:28:54", "remaining_time": "0:36:15"}
|
411 |
+
{"current_steps": 411, "total_steps": 426, "loss": 0.2277, "lr": 3.779869204754427e-08, "epoch": 2.8782201405152223, "percentage": 96.48, "elapsed_time": "15:31:02", "remaining_time": "0:33:58"}
|
412 |
+
{"current_steps": 412, "total_steps": 426, "loss": 0.1957, "lr": 3.2932216215704195e-08, "epoch": 2.8852459016393444, "percentage": 96.71, "elapsed_time": "15:33:11", "remaining_time": "0:31:42"}
|
413 |
+
{"current_steps": 413, "total_steps": 426, "loss": 0.1988, "lr": 2.8399935307778516e-08, "epoch": 2.892271662763466, "percentage": 96.95, "elapsed_time": "15:35:54", "remaining_time": "0:29:27"}
|
414 |
+
{"current_steps": 414, "total_steps": 426, "loss": 0.1873, "lr": 2.420215426530259e-08, "epoch": 2.899297423887588, "percentage": 97.18, "elapsed_time": "15:39:00", "remaining_time": "0:27:13"}
|
415 |
+
{"current_steps": 415, "total_steps": 426, "loss": 0.1845, "lr": 2.0339155523945164e-08, "epoch": 2.9063231850117095, "percentage": 97.42, "elapsed_time": "15:41:49", "remaining_time": "0:24:57"}
|
416 |
+
{"current_steps": 416, "total_steps": 426, "loss": 0.208, "lr": 1.681119899450856e-08, "epoch": 2.9133489461358315, "percentage": 97.65, "elapsed_time": "15:44:01", "remaining_time": "0:22:41"}
|
417 |
+
{"current_steps": 417, "total_steps": 426, "loss": 0.2026, "lr": 1.3618522045439897e-08, "epoch": 2.920374707259953, "percentage": 97.89, "elapsed_time": "15:46:10", "remaining_time": "0:20:25"}
|
418 |
+
{"current_steps": 418, "total_steps": 426, "loss": 0.2024, "lr": 1.0761339486859424e-08, "epoch": 2.927400468384075, "percentage": 98.12, "elapsed_time": "15:48:21", "remaining_time": "0:18:09"}
|
419 |
+
{"current_steps": 419, "total_steps": 426, "loss": 0.1698, "lr": 8.239843556108739e-09, "epoch": 2.9344262295081966, "percentage": 98.36, "elapsed_time": "15:50:31", "remaining_time": "0:15:52"}
|
420 |
+
{"current_steps": 420, "total_steps": 426, "loss": 0.2337, "lr": 6.054203904817812e-09, "epoch": 2.9414519906323187, "percentage": 98.59, "elapsed_time": "15:52:40", "remaining_time": "0:13:36"}
|
421 |
+
{"current_steps": 421, "total_steps": 426, "loss": 0.2318, "lr": 4.204567587486885e-09, "epoch": 2.9484777517564402, "percentage": 98.83, "elapsed_time": "15:54:38", "remaining_time": "0:11:20"}
|
422 |
+
{"current_steps": 422, "total_steps": 426, "loss": 0.1856, "lr": 2.6910590515966117e-09, "epoch": 2.9555035128805622, "percentage": 99.06, "elapsed_time": "15:56:47", "remaining_time": "0:09:04"}
|
423 |
+
{"current_steps": 423, "total_steps": 426, "loss": 0.227, "lr": 1.5137801292325338e-09, "epoch": 2.962529274004684, "percentage": 99.3, "elapsed_time": "15:58:53", "remaining_time": "0:06:48"}
|
424 |
+
{"current_steps": 424, "total_steps": 426, "loss": 0.1856, "lr": 6.728100302327844e-10, "epoch": 2.9695550351288054, "percentage": 99.53, "elapsed_time": "16:00:55", "remaining_time": "0:04:31"}
|
425 |
+
{"current_steps": 425, "total_steps": 426, "loss": 0.2299, "lr": 1.6820533686179308e-10, "epoch": 2.9765807962529274, "percentage": 99.77, "elapsed_time": "16:03:07", "remaining_time": "0:02:15"}
|
426 |
+
{"current_steps": 426, "total_steps": 426, "loss": 0.1971, "lr": 0.0, "epoch": 2.9836065573770494, "percentage": 100.0, "elapsed_time": "16:05:03", "remaining_time": "0:00:00"}
|
427 |
+
{"current_steps": 426, "total_steps": 426, "epoch": 2.9836065573770494, "percentage": 100.0, "elapsed_time": "16:15:22", "remaining_time": "0:00:00"}
|