mjschock committed on
Commit
2747cd5
·
verified ·
1 Parent(s): 56890f2

End of training

Browse files
README.md CHANGED
@@ -49,7 +49,7 @@ The following hyperparameters were used during training:
49
  ### Framework versions
50
 
51
  - PEFT 0.15.2
52
- - Transformers 4.51.3
53
- - Pytorch 2.7.0+cu126
54
  - Datasets 3.6.0
55
  - Tokenizers 0.21.1
 
49
  ### Framework versions
50
 
51
  - PEFT 0.15.2
52
+ - Transformers 4.52.4
53
+ - Pytorch 2.7.1+cu126
54
  - Datasets 3.6.0
55
  - Tokenizers 0.21.1
adapter_config.json CHANGED
@@ -24,13 +24,13 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "o_proj",
28
- "down_proj",
29
  "gate_proj",
30
  "up_proj",
31
- "k_proj",
32
  "q_proj",
33
- "v_proj"
 
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "v_proj",
28
+ "k_proj",
29
  "gate_proj",
30
  "up_proj",
 
31
  "q_proj",
32
+ "down_proj",
33
+ "o_proj"
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85eb56124f76082a064f2885f42f36981f79e9c57eb79b6e734b35b2d6299611
3
  size 11608320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e812953d3bb61a861db185119ec65067b680d88f06ac7066365fac6bf797a20d
3
  size 11608320
runs/Jun06_11-42-41_pop-os/events.out.tfevents.1749235361.pop-os.2938286.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dcd713b101eef24b002ef41fa2379eb0a7a71077db254432eacddf148144923
3
+ size 17841
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a90b3476b336213adf9b3010fa5a7133182fc5577c92ae0a139d6420ab445a46
3
- size 5841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c67bd46eb2a07c5b5bfd801ee7cc45bc58016537f486308a9f5b7024ae7a8e04
3
+ size 5777