kweinmeister committed
Commit fb940a7 · verified · 1 Parent(s): ebaadec

Training in progress, epoch 1

adapter_config.json CHANGED
@@ -3,8 +3,6 @@
   "auto_mapping": null,
   "base_model_name_or_path": "google/gemma-2-27b-it",
   "bias": "none",
-  "eva_config": null,
-  "exclude_modules": null,
   "fan_in_fan_out": null,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -12,8 +10,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 16,
-  "lora_bias": false,
+  "lora_alpha": 64,
   "lora_dropout": 0.05,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -23,12 +20,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "gate_proj",
     "v_proj",
-    "down_proj",
+    "gate_proj",
     "k_proj",
+    "o_proj",
     "up_proj",
+    "down_proj",
     "q_proj"
   ],
   "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0f3d6bb0152d9248d4d8c5595dbcc30c73c8ae1e34f03c387d8f1babd7e5d511
+oid sha256:64ee69a6b5ed2d91b48a6efdebe8a533cc37db75600ebcf8b786a1a0a22eab23
 size 456807968
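This change is only the Git LFS pointer moving to the new adapter weights (same 456,807,968-byte payload, new SHA-256). A minimal, hypothetical loading sketch, assuming the adapter is published in this repository (the repo id below is a placeholder):

```python
# Sketch: attach the updated adapter weights to the bfloat16 base model.
import torch
from transformers import AutoModelForCausalLM
from peft import PeftModel

base = AutoModelForCausalLM.from_pretrained(
    "google/gemma-2-27b-it",
    torch_dtype=torch.bfloat16,
    device_map="auto",
)
model = PeftModel.from_pretrained(base, "<this-adapter-repo>")  # placeholder id
```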
config.json CHANGED
@@ -27,7 +27,7 @@
   "_load_in_4bit": true,
   "_load_in_8bit": false,
   "bnb_4bit_compute_dtype": "bfloat16",
-  "bnb_4bit_quant_storage": "uint8",
+  "bnb_4bit_quant_storage": "bfloat16",
   "bnb_4bit_quant_type": "nf4",
   "bnb_4bit_use_double_quant": true,
   "llm_int8_enable_fp32_cpu_offload": false,
@@ -44,7 +44,7 @@
   "sliding_window": 4096,
   "sliding_window_size": 4096,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.47.1",
+  "transformers_version": "4.46.3",
   "use_cache": false,
   "vocab_size": 256000
 }
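The quantization block now stores the 4-bit weights in bfloat16 containers instead of uint8, a setting commonly used so QLoRA weights can be wrapped and sharded uniformly (for example under FSDP). A hedged sketch of the equivalent transformers BitsAndBytesConfig, built only from the fields visible in this hunk:

```python
# Sketch: matches the updated bitsandbytes fields in config.json.
import torch
from transformers import BitsAndBytesConfig

bnb_config = BitsAndBytesConfig(
    load_in_4bit=True,
    bnb_4bit_compute_dtype=torch.bfloat16,
    bnb_4bit_quant_type="nf4",
    bnb_4bit_use_double_quant=True,
    bnb_4bit_quant_storage=torch.bfloat16,  # was "uint8" before this commit
)
```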
tokenizer_config.json CHANGED
@@ -2003,7 +2003,6 @@
   "chat_template": "{{ bos_token }}{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\n' + message['content'] | trim + '<end_of_turn>\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\n'}}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<eos>",
-  "extra_special_tokens": {},
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0a6b229a80811553a8917ed8e0f624c6e8ad3674fe3237b402de0aa44dd4c70d
-size 7992
+oid sha256:cf34f757061c10a83a328ef66420695ee72014af4919f9aa990773d92f93b3c9
+size 8120