Training in progress, step 600
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 295488936
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a9fe368cada65a1d14e0d43824db3cfa6564a7e9352735addd8e143a521f036
|
3 |
size 295488936
|
trainer_log.jsonl
CHANGED
@@ -76,3 +76,14 @@
|
|
76 |
{"current_steps": 490, "total_steps": 610, "loss": 0.1348, "lr": 1.1332466114513512e-05, "epoch": 0.8032786885245902, "percentage": 80.33, "elapsed_time": "0:16:36", "remaining_time": "0:04:04"}
|
77 |
{"current_steps": 500, "total_steps": 610, "loss": 0.1065, "lr": 9.582812136100783e-06, "epoch": 0.819672131147541, "percentage": 81.97, "elapsed_time": "0:18:41", "remaining_time": "0:04:06"}
|
78 |
{"current_steps": 500, "total_steps": 610, "eval_loss": 0.1266276091337204, "epoch": 0.819672131147541, "percentage": 81.97, "elapsed_time": "0:19:43", "remaining_time": "0:04:20"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
76 |
{"current_steps": 490, "total_steps": 610, "loss": 0.1348, "lr": 1.1332466114513512e-05, "epoch": 0.8032786885245902, "percentage": 80.33, "elapsed_time": "0:16:36", "remaining_time": "0:04:04"}
|
77 |
{"current_steps": 500, "total_steps": 610, "loss": 0.1065, "lr": 9.582812136100783e-06, "epoch": 0.819672131147541, "percentage": 81.97, "elapsed_time": "0:18:41", "remaining_time": "0:04:06"}
|
78 |
{"current_steps": 500, "total_steps": 610, "eval_loss": 0.1266276091337204, "epoch": 0.819672131147541, "percentage": 81.97, "elapsed_time": "0:19:43", "remaining_time": "0:04:20"}
|
79 |
+
{"current_steps": 510, "total_steps": 610, "loss": 0.114, "lr": 7.965471193905954e-06, "epoch": 0.8360655737704918, "percentage": 83.61, "elapsed_time": "0:21:57", "remaining_time": "0:04:18"}
|
80 |
+
{"current_steps": 520, "total_steps": 610, "loss": 0.1114, "lr": 6.4857379484922375e-06, "epoch": 0.8524590163934426, "percentage": 85.25, "elapsed_time": "0:23:35", "remaining_time": "0:04:05"}
|
81 |
+
{"current_steps": 530, "total_steps": 610, "loss": 0.1265, "lr": 5.148456576529081e-06, "epoch": 0.8688524590163934, "percentage": 86.89, "elapsed_time": "0:25:41", "remaining_time": "0:03:52"}
|
82 |
+
{"current_steps": 540, "total_steps": 610, "loss": 0.1418, "lr": 3.958004912496127e-06, "epoch": 0.8852459016393442, "percentage": 88.52, "elapsed_time": "0:27:29", "remaining_time": "0:03:33"}
|
83 |
+
{"current_steps": 550, "total_steps": 610, "loss": 0.1555, "lr": 2.918280117043709e-06, "epoch": 0.9016393442622951, "percentage": 90.16, "elapsed_time": "0:29:12", "remaining_time": "0:03:11"}
|
84 |
+
{"current_steps": 560, "total_steps": 610, "loss": 0.1195, "lr": 2.032685918926508e-06, "epoch": 0.9180327868852459, "percentage": 91.8, "elapsed_time": "0:31:02", "remaining_time": "0:02:46"}
|
85 |
+
{"current_steps": 570, "total_steps": 610, "loss": 0.1395, "lr": 1.3041214722768035e-06, "epoch": 0.9344262295081968, "percentage": 93.44, "elapsed_time": "0:32:44", "remaining_time": "0:02:17"}
|
86 |
+
{"current_steps": 580, "total_steps": 610, "loss": 0.1296, "lr": 7.349718656945504e-07, "epoch": 0.9508196721311475, "percentage": 95.08, "elapsed_time": "0:34:35", "remaining_time": "0:01:47"}
|
87 |
+
{"current_steps": 590, "total_steps": 610, "loss": 0.1411, "lr": 3.271003142248652e-07, "epoch": 0.9672131147540983, "percentage": 96.72, "elapsed_time": "0:36:16", "remaining_time": "0:01:13"}
|
88 |
+
{"current_steps": 600, "total_steps": 610, "loss": 0.1174, "lr": 8.184205978370996e-08, "epoch": 0.9836065573770492, "percentage": 98.36, "elapsed_time": "0:37:59", "remaining_time": "0:00:37"}
|
89 |
+
{"current_steps": 600, "total_steps": 610, "eval_loss": 0.12527307868003845, "epoch": 0.9836065573770492, "percentage": 98.36, "elapsed_time": "0:39:01", "remaining_time": "0:00:39"}
|