Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4180df440ce5cd18dd6171e2e284ed0aaa2831f88cd375288774c1bf9e60bc93
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cda9837a8d6899eec86fc86dc8328c7f71dbef26017e41636b038f918b03ed84
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6fa5b55a76bf348f8c06e0c7d4ffad9f20760ee13d12913c11d0c7436155575
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a899bcd13f961e2731ea151e30259e62b5c6972f2a43128fcab9c638d6f64217
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,8 @@
|
|
10 |
{"current_steps": 10, "total_steps": 25, "loss": 0.6852, "lr": 7.703204087277989e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:12:27", "remaining_time": "0:18:40"}
|
11 |
{"current_steps": 11, "total_steps": 25, "loss": 0.6784, "lr": 7.0770750650094335e-06, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "0:14:41", "remaining_time": "0:18:41"}
|
12 |
{"current_steps": 12, "total_steps": 25, "loss": 0.6349, "lr": 6.408662784207149e-06, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "0:15:51", "remaining_time": "0:17:10"}
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 10, "total_steps": 25, "loss": 0.6852, "lr": 7.703204087277989e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:12:27", "remaining_time": "0:18:40"}
|
11 |
{"current_steps": 11, "total_steps": 25, "loss": 0.6784, "lr": 7.0770750650094335e-06, "epoch": 2.2, "percentage": 44.0, "elapsed_time": "0:14:41", "remaining_time": "0:18:41"}
|
12 |
{"current_steps": 12, "total_steps": 25, "loss": 0.6349, "lr": 6.408662784207149e-06, "epoch": 2.4, "percentage": 48.0, "elapsed_time": "0:15:51", "remaining_time": "0:17:10"}
|
13 |
+
{"current_steps": 13, "total_steps": 25, "loss": 0.6179, "lr": 5.711574191366427e-06, "epoch": 2.6, "percentage": 52.0, "elapsed_time": "0:17:11", "remaining_time": "0:15:52"}
|
14 |
+
{"current_steps": 14, "total_steps": 25, "loss": 0.6468, "lr": 5e-06, "epoch": 2.8, "percentage": 56.0, "elapsed_time": "0:18:10", "remaining_time": "0:14:16"}
|
15 |
+
{"current_steps": 15, "total_steps": 25, "loss": 0.6264, "lr": 4.2884258086335755e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:19:20", "remaining_time": "0:12:53"}
|
16 |
+
{"current_steps": 16, "total_steps": 25, "loss": 0.5678, "lr": 3.5913372157928515e-06, "epoch": 3.2, "percentage": 64.0, "elapsed_time": "0:21:32", "remaining_time": "0:12:07"}
|
17 |
+
{"current_steps": 17, "total_steps": 25, "loss": 0.6467, "lr": 2.9229249349905686e-06, "epoch": 3.4, "percentage": 68.0, "elapsed_time": "0:22:49", "remaining_time": "0:10:44"}
|