Training in progress, step 1524
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f845b7ee39b514b8ec237be4f79636b06142db4f13b92c30175733c643ec948
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2ada0085f2db1b7c4f12039a2830c108327f27affeb6eadfaf83c47334524ac
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96d2f324e8e7e9e21c3559a43fa69cdd6c2569e0327659c23950d22a25246d2d
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e07bf74e69d542060b4d89a0d7db034eeaefdad969e6a94954ac94c26456386
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -1501,3 +1501,25 @@
|
|
1501 |
{"current_steps": 1501, "total_steps": 1524, "loss": 0.4116, "lr": 6.942565518810451e-09, "epoch": 2.950851900393185, "percentage": 98.49, "elapsed_time": "22:31:55", "remaining_time": "0:20:42"}
|
1502 |
{"current_steps": 1502, "total_steps": 1524, "loss": 0.3971, "lr": 6.352113192141241e-09, "epoch": 2.9528178243774574, "percentage": 98.56, "elapsed_time": "22:32:49", "remaining_time": "0:19:48"}
|
1503 |
{"current_steps": 1503, "total_steps": 1524, "loss": 0.4305, "lr": 5.787881461636891e-09, "epoch": 2.95478374836173, "percentage": 98.62, "elapsed_time": "22:33:42", "remaining_time": "0:18:54"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1501 |
{"current_steps": 1501, "total_steps": 1524, "loss": 0.4116, "lr": 6.942565518810451e-09, "epoch": 2.950851900393185, "percentage": 98.49, "elapsed_time": "22:31:55", "remaining_time": "0:20:42"}
|
1502 |
{"current_steps": 1502, "total_steps": 1524, "loss": 0.3971, "lr": 6.352113192141241e-09, "epoch": 2.9528178243774574, "percentage": 98.56, "elapsed_time": "22:32:49", "remaining_time": "0:19:48"}
|
1503 |
{"current_steps": 1503, "total_steps": 1524, "loss": 0.4305, "lr": 5.787881461636891e-09, "epoch": 2.95478374836173, "percentage": 98.62, "elapsed_time": "22:33:42", "remaining_time": "0:18:54"}
|
1504 |
+
{"current_steps": 1504, "total_steps": 1524, "loss": 0.4107, "lr": 5.24987328995974e-09, "epoch": 2.9567496723460027, "percentage": 98.69, "elapsed_time": "22:34:35", "remaining_time": "0:18:00"}
|
1505 |
+
{"current_steps": 1505, "total_steps": 1524, "loss": 0.4312, "lr": 4.738091502077269e-09, "epoch": 2.958715596330275, "percentage": 98.75, "elapsed_time": "22:35:29", "remaining_time": "0:17:06"}
|
1506 |
+
{"current_steps": 1506, "total_steps": 1524, "loss": 0.4122, "lr": 4.252538785248228e-09, "epoch": 2.960681520314548, "percentage": 98.82, "elapsed_time": "22:36:22", "remaining_time": "0:16:12"}
|
1507 |
+
{"current_steps": 1507, "total_steps": 1524, "loss": 0.4288, "lr": 3.793217689008199e-09, "epoch": 2.9626474442988204, "percentage": 98.88, "elapsed_time": "22:37:15", "remaining_time": "0:15:18"}
|
1508 |
+
{"current_steps": 1508, "total_steps": 1524, "loss": 0.4153, "lr": 3.360130625155722e-09, "epoch": 2.964613368283093, "percentage": 98.95, "elapsed_time": "22:38:10", "remaining_time": "0:14:24"}
|
1509 |
+
{"current_steps": 1509, "total_steps": 1524, "loss": 0.4211, "lr": 2.9532798677395226e-09, "epoch": 2.9665792922673657, "percentage": 99.02, "elapsed_time": "22:39:04", "remaining_time": "0:13:30"}
|
1510 |
+
{"current_steps": 1510, "total_steps": 1524, "loss": 0.4123, "lr": 2.5726675530479695e-09, "epoch": 2.968545216251638, "percentage": 99.08, "elapsed_time": "22:39:58", "remaining_time": "0:12:36"}
|
1511 |
+
{"current_steps": 1511, "total_steps": 1524, "loss": 0.4341, "lr": 2.21829567959686e-09, "epoch": 2.970511140235911, "percentage": 99.15, "elapsed_time": "22:40:52", "remaining_time": "0:11:42"}
|
1512 |
+
{"current_steps": 1512, "total_steps": 1524, "loss": 0.4095, "lr": 1.8901661081172084e-09, "epoch": 2.9724770642201834, "percentage": 99.21, "elapsed_time": "22:41:46", "remaining_time": "0:10:48"}
|
1513 |
+
{"current_steps": 1513, "total_steps": 1524, "loss": 0.4119, "lr": 1.5882805615496931e-09, "epoch": 2.974442988204456, "percentage": 99.28, "elapsed_time": "22:42:40", "remaining_time": "0:09:54"}
|
1514 |
+
{"current_steps": 1514, "total_steps": 1524, "loss": 0.4085, "lr": 1.312640625030781e-09, "epoch": 2.9764089121887287, "percentage": 99.34, "elapsed_time": "22:43:34", "remaining_time": "0:09:00"}
|
1515 |
+
{"current_steps": 1515, "total_steps": 1524, "loss": 0.4281, "lr": 1.0632477458888401e-09, "epoch": 2.9783748361730016, "percentage": 99.41, "elapsed_time": "22:44:28", "remaining_time": "0:08:06"}
|
1516 |
+
{"current_steps": 1516, "total_steps": 1524, "loss": 0.4218, "lr": 8.401032336330384e-10, "epoch": 2.980340760157274, "percentage": 99.48, "elapsed_time": "22:45:22", "remaining_time": "0:07:12"}
|
1517 |
+
{"current_steps": 1517, "total_steps": 1524, "loss": 0.4187, "lr": 6.432082599489021e-10, "epoch": 2.9823066841415464, "percentage": 99.54, "elapsed_time": "22:46:16", "remaining_time": "0:06:18"}
|
1518 |
+
{"current_steps": 1518, "total_steps": 1524, "loss": 0.429, "lr": 4.725638586894344e-10, "epoch": 2.9842726081258193, "percentage": 99.61, "elapsed_time": "22:47:10", "remaining_time": "0:05:24"}
|
1519 |
+
{"current_steps": 1519, "total_steps": 1524, "loss": 0.4134, "lr": 3.2817092587345e-10, "epoch": 2.9862385321100917, "percentage": 99.67, "elapsed_time": "22:48:04", "remaining_time": "0:04:30"}
|
1520 |
+
{"current_steps": 1520, "total_steps": 1524, "loss": 0.4259, "lr": 2.1003021967780369e-10, "epoch": 2.9882044560943646, "percentage": 99.74, "elapsed_time": "22:48:58", "remaining_time": "0:03:36"}
|
1521 |
+
{"current_steps": 1521, "total_steps": 1524, "loss": 0.4127, "lr": 1.1814236043405924e-10, "epoch": 2.990170380078637, "percentage": 99.8, "elapsed_time": "22:49:51", "remaining_time": "0:02:42"}
|
1522 |
+
{"current_steps": 1522, "total_steps": 1524, "loss": 0.4284, "lr": 5.250783062682452e-11, "epoch": 2.9921363040629094, "percentage": 99.87, "elapsed_time": "22:50:45", "remaining_time": "0:01:48"}
|
1523 |
+
{"current_steps": 1523, "total_steps": 1524, "loss": 0.4265, "lr": 1.3126974888200139e-11, "epoch": 2.9941022280471823, "percentage": 99.93, "elapsed_time": "22:51:38", "remaining_time": "0:00:54"}
|
1524 |
+
{"current_steps": 1524, "total_steps": 1524, "loss": 0.4213, "lr": 0.0, "epoch": 2.9960681520314547, "percentage": 100.0, "elapsed_time": "22:52:31", "remaining_time": "0:00:00"}
|
1525 |
+
{"current_steps": 1524, "total_steps": 1524, "epoch": 2.9960681520314547, "percentage": 100.0, "elapsed_time": "22:53:24", "remaining_time": "0:00:00"}
|