Jlonge4/outputs
Browse files
- README.md +1 -1
- adapter_config.json +5 -5
- adapter_model.safetensors +1 -1
- runs/Jun13_00-37-43_ec2c06351a1f/events.out.tfevents.1718239065.ec2c06351a1f.720.0 +3 -0
- runs/Jun13_00-41-37_ec2c06351a1f/events.out.tfevents.1718239298.ec2c06351a1f.2444.0 +3 -0
- runs/Jun13_00-41-54_ec2c06351a1f/events.out.tfevents.1718239315.ec2c06351a1f.2444.1 +3 -0
- runs/Jun13_00-42-35_ec2c06351a1f/events.out.tfevents.1718239357.ec2c06351a1f.2882.0 +3 -0
- training_args.bin +1 -1
README.md
CHANGED
@@ -44,7 +44,7 @@ The following hyperparameters were used during training:
|
|
44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
45 |
- lr_scheduler_type: linear
|
46 |
- lr_scheduler_warmup_steps: 10
|
47 |
-
- training_steps:
|
48 |
- mixed_precision_training: Native AMP
|
49 |
|
50 |
### Training results
|
|
|
44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
45 |
- lr_scheduler_type: linear
|
46 |
- lr_scheduler_warmup_steps: 10
|
47 |
+
- training_steps: 20
|
48 |
- mixed_precision_training: Native AMP
|
49 |
|
50 |
### Training results
|
adapter_config.json
CHANGED
@@ -20,13 +20,13 @@
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
-
"
|
24 |
-
"v_proj",
|
25 |
-
"q_proj",
|
26 |
"k_proj",
|
|
|
|
|
27 |
"down_proj",
|
28 |
-
"
|
29 |
-
"
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
32 |
"use_dora": false,
|
|
|
20 |
"rank_pattern": {},
|
21 |
"revision": null,
|
22 |
"target_modules": [
|
23 |
+
"gate_proj",
|
|
|
|
|
24 |
"k_proj",
|
25 |
+
"q_proj",
|
26 |
+
"up_proj",
|
27 |
"down_proj",
|
28 |
+
"v_proj",
|
29 |
+
"o_proj"
|
30 |
],
|
31 |
"task_type": "CAUSAL_LM",
|
32 |
"use_dora": false,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 71320216
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21b26c4d2931449acf14c09b0c1c3a4c0fe7e486f89e2b9e7a70bc9ddfda41f4
|
3 |
size 71320216
|
runs/Jun13_00-37-43_ec2c06351a1f/events.out.tfevents.1718239065.ec2c06351a1f.720.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e320a5ec0eb4aac42b314718e08f60affd51ff82f139a6ccac59fdb8f499d7a
|
3 |
+
size 24119
|
runs/Jun13_00-41-37_ec2c06351a1f/events.out.tfevents.1718239298.ec2c06351a1f.2444.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27c577e4be80a5ab685edb9d162de6052bbb2f2f14049f673122f974114c99c7
|
3 |
+
size 10730
|
runs/Jun13_00-41-54_ec2c06351a1f/events.out.tfevents.1718239315.ec2c06351a1f.2444.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2f5b7e89a5b0e76ff91883dfa73be0345e8e589e0f9d37676a7e6ea1fc4d30b
|
3 |
+
size 4184
|
runs/Jun13_00-42-35_ec2c06351a1f/events.out.tfevents.1718239357.ec2c06351a1f.2882.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05802974ea315d2ee4f093cd3fb317920b9d12476a0a8ec60a329b4805e786b9
|
3 |
+
size 9629
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5048
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ddc2f7a0066efb4e758b012ccf06290a2498c7b11e8c15f86b37d8a4b95d4c0
|
3 |
size 5048
|