Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8bad1e88066e430e82d2a4d57b4480f07eefb85ae89aed4e479e898a516071f
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5fcc07459b7621181961c5cf1cb0fbb1102f532089133b7b0a98c70601a3b414
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e169ae1128b3378bcccfa175ca5f73143171336ffd6cb24382dea2647c8897ae
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c846cede97c1820b8b03ce63d1d78de4e27207395b44ed95df0f8d90dfd99b1
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -15,3 +15,8 @@
|
|
15 |
{"current_steps": 15, "total_steps": 25, "loss": 0.6264, "lr": 4.2884258086335755e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:19:20", "remaining_time": "0:12:53"}
|
16 |
{"current_steps": 16, "total_steps": 25, "loss": 0.5678, "lr": 3.5913372157928515e-06, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "0:21:32", "remaining_time": "0:12:07"}
|
17 |
{"current_steps": 17, "total_steps": 25, "loss": 0.6467, "lr": 2.9229249349905686e-06, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "0:22:49", "remaining_time": "0:10:44"}
|
|
|
|
|
|
|
|
|
|
|
|
15 |
{"current_steps": 15, "total_steps": 25, "loss": 0.6264, "lr": 4.2884258086335755e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:19:20", "remaining_time": "0:12:53"}
|
16 |
{"current_steps": 16, "total_steps": 25, "loss": 0.5678, "lr": 3.5913372157928515e-06, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "0:21:32", "remaining_time": "0:12:07"}
|
17 |
{"current_steps": 17, "total_steps": 25, "loss": 0.6467, "lr": 2.9229249349905686e-06, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "0:22:49", "remaining_time": "0:10:44"}
|
18 |
+
{"current_steps": 18, "total_steps": 25, "loss": 0.5901, "lr": 2.296795912722014e-06, "epoch": 3.6, "percentage": 72.0, "elapsed_time": "0:24:11", "remaining_time": "0:09:24"}
|
19 |
+
{"current_steps": 19, "total_steps": 25, "loss": 0.5917, "lr": 1.7256963302735752e-06, "epoch": 3.8, "percentage": 76.0, "elapsed_time": "0:24:57", "remaining_time": "0:07:52"}
|
20 |
+
{"current_steps": 20, "total_steps": 25, "loss": 0.5287, "lr": 1.2212521282287093e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "0:25:57", "remaining_time": "0:06:29"}
|
21 |
+
{"current_steps": 21, "total_steps": 25, "loss": 0.5862, "lr": 7.937323358440935e-07, "epoch": 4.2, "percentage": 84.0, "elapsed_time": "0:28:11", "remaining_time": "0:05:22"}
|
22 |
+
{"current_steps": 22, "total_steps": 25, "loss": 0.5381, "lr": 4.5184002322740784e-07, "epoch": 4.4, "percentage": 88.0, "elapsed_time": "0:29:25", "remaining_time": "0:04:00"}
|