dharsan01 committed on
Commit
9f3f31c
·
verified ·
1 Parent(s): 665a641

Training in progress, step 10

Browse files
adapter_config.json CHANGED
@@ -3,6 +3,7 @@
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "vilsonrodrigues/falcon-7b-instruct-sharded",
5
  "bias": "none",
 
6
  "exclude_modules": null,
7
  "fan_in_fan_out": false,
8
  "inference_mode": true,
@@ -12,6 +13,7 @@
12
  "layers_to_transform": null,
13
  "loftq_config": {},
14
  "lora_alpha": 32,
 
15
  "lora_dropout": 0.05,
16
  "megatron_config": null,
17
  "megatron_core": "megatron.core",
@@ -21,10 +23,10 @@
21
  "rank_pattern": {},
22
  "revision": null,
23
  "target_modules": [
24
- "dense_4h_to_h",
25
  "dense",
26
  "dense_h_to_4h",
27
- "query_key_value"
 
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
 
3
  "auto_mapping": null,
4
  "base_model_name_or_path": "vilsonrodrigues/falcon-7b-instruct-sharded",
5
  "bias": "none",
6
+ "eva_config": null,
7
  "exclude_modules": null,
8
  "fan_in_fan_out": false,
9
  "inference_mode": true,
 
13
  "layers_to_transform": null,
14
  "loftq_config": {},
15
  "lora_alpha": 32,
16
+ "lora_bias": false,
17
  "lora_dropout": 0.05,
18
  "megatron_config": null,
19
  "megatron_core": "megatron.core",
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
26
  "dense",
27
  "dense_h_to_4h",
28
+ "query_key_value",
29
+ "dense_4h_to_h"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af93310b50cfc41d5abc25ca8b4e6d34c3cbcb7fc5814a8dd83c0b3d5dca9769
3
  size 261131840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2f3449228776f84f4a79a30ddfdab7df154a8b797d111c75d1bdb9a3878dc8b
3
  size 261131840
runs/Dec12_10-57-19_493b1151e23a/events.out.tfevents.1734001040.493b1151e23a.470.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08ac6a2795b530e2e01eede304175fa8a0aa17ac82e6eb846fd1b24e921bc8a4
3
+ size 6856
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1116ef3fe976cb5662d5a4d2533136ba6484cae4e85e529ec6d771a571d60c9b
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:864bd1a9240960deed89becb4ec6c983c98bc54d148a373a1c666db47a5040ec
3
  size 5560