Training in progress, step 420
Browse files- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- trainer_log.jsonl +6 -12
- training_args.bin +1 -1
adapter_config.json
CHANGED
@@ -23,13 +23,13 @@
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
26 |
-
"k_proj",
|
27 |
-
"q_proj",
|
28 |
-
"down_proj",
|
29 |
-
"gate_proj",
|
30 |
"v_proj",
|
31 |
"up_proj",
|
32 |
-
"o_proj"
|
|
|
|
|
|
|
|
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
|
|
23 |
"rank_pattern": {},
|
24 |
"revision": null,
|
25 |
"target_modules": [
|
|
|
|
|
|
|
|
|
26 |
"v_proj",
|
27 |
"up_proj",
|
28 |
+
"o_proj",
|
29 |
+
"down_proj",
|
30 |
+
"k_proj",
|
31 |
+
"gate_proj",
|
32 |
+
"q_proj"
|
33 |
],
|
34 |
"task_type": "CAUSAL_LM",
|
35 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 80792456
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8130e83528e67064027d9f72500e72b9c8f84725905e2ed7556b045263bd1cd
|
3 |
size 80792456
|
trainer_log.jsonl
CHANGED
@@ -1,12 +1,6 @@
|
|
1 |
-
{"current_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps":
|
6 |
-
{"current_steps":
|
7 |
-
{"current_steps": 310, "total_steps": 2550, "loss": 0.5897, "lr": 0.00029157806983015394, "epoch": 0.3644914756025867, "percentage": 12.16, "elapsed_time": "5:55:57", "remaining_time": "1 day, 18:52:05"}
|
8 |
-
{"current_steps": 320, "total_steps": 2550, "loss": 0.5936, "lr": 0.00029094675704057724, "epoch": 0.37624926513815404, "percentage": 12.55, "elapsed_time": "6:46:54", "remaining_time": "1 day, 23:15:39"}
|
9 |
-
{"current_steps": 330, "total_steps": 2550, "loss": 0.5876, "lr": 0.00029029336411618865, "epoch": 0.3880070546737213, "percentage": 12.94, "elapsed_time": "7:37:50", "remaining_time": "2 days, 3:19:59"}
|
10 |
-
{"current_steps": 340, "total_steps": 2550, "loss": 0.5884, "lr": 0.0002896179934148158, "epoch": 0.39976484420928865, "percentage": 13.33, "elapsed_time": "8:28:43", "remaining_time": "2 days, 7:06:42"}
|
11 |
-
{"current_steps": 350, "total_steps": 2550, "loss": 0.5846, "lr": 0.0002889207507372337, "epoch": 0.411522633744856, "percentage": 13.73, "elapsed_time": "9:19:33", "remaining_time": "2 days, 10:37:15"}
|
12 |
-
{"current_steps": 360, "total_steps": 2550, "loss": 0.5862, "lr": 0.0002882017453105906, "epoch": 0.42328042328042326, "percentage": 14.12, "elapsed_time": "10:10:28", "remaining_time": "2 days, 13:53:43"}
|
|
|
1 |
+
{"current_steps": 370, "total_steps": 2550, "loss": 0.5724, "lr": 0.0002865363126582549, "epoch": 0.4350382128159906, "percentage": 14.51, "elapsed_time": "0:51:02", "remaining_time": "5:00:45"}
|
2 |
+
{"current_steps": 380, "total_steps": 2550, "loss": 0.589, "lr": 0.00028575266221296395, "epoch": 0.4467960023515579, "percentage": 14.9, "elapsed_time": "1:42:04", "remaining_time": "9:42:51"}
|
3 |
+
{"current_steps": 390, "total_steps": 2550, "loss": 0.5887, "lr": 0.00028494798058030713, "epoch": 0.4585537918871252, "percentage": 15.29, "elapsed_time": "2:33:10", "remaining_time": "14:08:22"}
|
4 |
+
{"current_steps": 400, "total_steps": 2550, "loss": 0.5764, "lr": 0.0002841223924238447, "epoch": 0.4703115814226925, "percentage": 15.69, "elapsed_time": "3:24:19", "remaining_time": "18:18:12"}
|
5 |
+
{"current_steps": 410, "total_steps": 2550, "loss": 0.5808, "lr": 0.0002832760256460349, "epoch": 0.48206937095825986, "percentage": 16.08, "elapsed_time": "4:15:30", "remaining_time": "22:13:39"}
|
6 |
+
{"current_steps": 420, "total_steps": 2550, "loss": 0.5733, "lr": 0.00028240901136841886, "epoch": 0.49382716049382713, "percentage": 16.47, "elapsed_time": "5:07:05", "remaining_time": "1 day, 1:57:23"}
|
|
|
|
|
|
|
|
|
|
|
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5752
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12eac2dba3df35b6c9379924bc2a67b96e3d059dafdc119c9ec63ba9d7c614e2
|
3 |
size 5752
|