Training in progress, step 16324
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +5 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 29034840
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6dd27678e81e52b77b203ee21948888d64924194d564a7da5da8608977a649ef
|
3 |
size 29034840
|
trainer_log.jsonl
CHANGED
@@ -3607,3 +3607,8 @@
|
|
3607 |
{"current_steps": 16295, "total_steps": 16324, "loss": 0.1816, "lr": 8.629366747170408e-10, "epoch": 1.9963553949343051, "percentage": 99.82, "elapsed_time": "7:57:19", "remaining_time": "0:00:50", "throughput": 3808.74, "total_tokens": 109078888}
|
3608 |
{"current_steps": 16300, "total_steps": 16324, "loss": 0.2158, "lr": 5.910249407270474e-10, "epoch": 1.9969679336008086, "percentage": 99.85, "elapsed_time": "7:58:17", "remaining_time": "0:00:42", "throughput": 3802.14, "total_tokens": 109112120}
|
3609 |
{"current_steps": 16300, "total_steps": 16324, "eval_loss": 0.11464700102806091, "epoch": 1.9969679336008086, "percentage": 99.85, "elapsed_time": "7:58:36", "remaining_time": "0:00:42", "throughput": 3799.61, "total_tokens": 109112120}
|
|
|
|
|
|
|
|
|
|
|
|
3607 |
{"current_steps": 16295, "total_steps": 16324, "loss": 0.1816, "lr": 8.629366747170408e-10, "epoch": 1.9963553949343051, "percentage": 99.82, "elapsed_time": "7:57:19", "remaining_time": "0:00:50", "throughput": 3808.74, "total_tokens": 109078888}
|
3608 |
{"current_steps": 16300, "total_steps": 16324, "loss": 0.2158, "lr": 5.910249407270474e-10, "epoch": 1.9969679336008086, "percentage": 99.85, "elapsed_time": "7:58:17", "remaining_time": "0:00:42", "throughput": 3802.14, "total_tokens": 109112120}
|
3609 |
{"current_steps": 16300, "total_steps": 16324, "eval_loss": 0.11464700102806091, "epoch": 1.9969679336008086, "percentage": 99.85, "elapsed_time": "7:58:36", "remaining_time": "0:00:42", "throughput": 3799.61, "total_tokens": 109112120}
|
3610 |
+
{"current_steps": 16305, "total_steps": 16324, "loss": 0.2376, "lr": 3.7041694531114723e-10, "epoch": 1.9975804722673118, "percentage": 99.88, "elapsed_time": "7:59:40", "remaining_time": "0:00:33", "throughput": 3792.37, "total_tokens": 109145312}
|
3611 |
+
{"current_steps": 16310, "total_steps": 16324, "loss": 0.2031, "lr": 2.0111291483271288e-10, "epoch": 1.9981930109338153, "percentage": 99.91, "elapsed_time": "8:00:38", "remaining_time": "0:00:24", "throughput": 3785.87, "total_tokens": 109179312}
|
3612 |
+
{"current_steps": 16315, "total_steps": 16324, "loss": 0.2135, "lr": 8.311302300278989e-11, "epoch": 1.9988055496003185, "percentage": 99.94, "elapsed_time": "8:01:37", "remaining_time": "0:00:15", "throughput": 3779.33, "total_tokens": 109212488}
|
3613 |
+
{"current_steps": 16320, "total_steps": 16324, "loss": 0.2092, "lr": 1.6417390907852438e-11, "epoch": 1.9994180882668218, "percentage": 99.98, "elapsed_time": "8:02:35", "remaining_time": "0:00:07", "throughput": 3772.91, "total_tokens": 109246064}
|
3614 |
+
{"current_steps": 16324, "total_steps": 16324, "epoch": 1.9999081192000245, "percentage": 100.0, "elapsed_time": "8:03:27", "remaining_time": "0:00:00", "throughput": 3767.11, "total_tokens": 109273408}
|