MaiAhmed committed on
Commit
bfa9637
·
verified ·
1 Parent(s): c18f6f5

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -13,30 +13,27 @@
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
- "lora_alpha": 16,
17
  "lora_bias": false,
18
  "lora_dropout": 0.05,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
- "modules_to_save": [
22
- "lm_head",
23
- "embed_tokens"
24
- ],
25
  "peft_type": "LORA",
26
  "r": 16,
27
  "rank_pattern": {},
28
  "revision": null,
29
  "target_modules": [
30
- "down_proj",
31
- "k_proj",
32
  "fc1",
33
- "o_proj",
34
- "q_proj",
35
  "fc2",
36
- "gate_proj",
37
- "up_proj",
38
  "out_proj",
39
- "v_proj"
 
 
 
 
40
  ],
41
  "task_type": "CAUSAL_LM",
42
  "trainable_token_indices": null,
 
13
  "layers_pattern": null,
14
  "layers_to_transform": null,
15
  "loftq_config": {},
16
+ "lora_alpha": 32,
17
  "lora_bias": false,
18
  "lora_dropout": 0.05,
19
  "megatron_config": null,
20
  "megatron_core": "megatron.core",
21
+ "modules_to_save": null,
 
 
 
22
  "peft_type": "LORA",
23
  "r": 16,
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
 
 
27
  "fc1",
 
 
28
  "fc2",
29
+ "q_proj",
30
+ "k_proj",
31
  "out_proj",
32
+ "o_proj",
33
+ "v_proj",
34
+ "up_proj",
35
+ "gate_proj",
36
+ "down_proj"
37
  ],
38
  "task_type": "CAUSAL_LM",
39
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5437a85ef905468b3230f19d00fd90f28810c2791599fe45ec77b92eb655957
3
- size 2839124552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2f4a075f1381b6bb04cc471e7eb8466ebffa1425a4b303d4920947b867a1664
3
+ size 154114368
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7264346be152c9c1da00ecffebf96554a557d4bfe3502bdb21e4bece2d1a742e
3
- size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c20bef00ffc01a53cf9b560ca51c42803e0cdb647cd2778efd7f0f66a4cb3aec
3
+ size 5752