suhani-sarvam committed on
Commit
a65c10a
·
verified ·
1 Parent(s): 8289078

Training in progress, step 145

Browse files
adapter_config.json CHANGED
@@ -23,12 +23,12 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "q_proj",
27
  "gate_proj",
 
 
 
28
  "o_proj",
29
  "v_proj",
30
- "down_proj",
31
- "up_proj",
32
  "k_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
 
26
  "gate_proj",
27
+ "q_proj",
28
+ "up_proj",
29
+ "down_proj",
30
  "o_proj",
31
  "v_proj",
 
 
32
  "k_proj"
33
  ],
34
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:05e236eab30054f522ca48df2f086c2139b2b50d1cc6fba248f28c0de6aaf5f4
3
- size 383569528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0000e9eaae249b63b6c51005803c609b3ed411a71e3c9a45ca87be6b026f6358
3
+ size 941420376
special_tokens_map.json CHANGED
@@ -1,4 +1,13 @@
1
  {
 
 
 
 
 
 
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
@@ -13,7 +22,7 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": "<unk>",
17
  "unk_token": {
18
  "content": "<unk>",
19
  "lstrip": false,
 
1
  {
2
+ "additional_special_tokens": [
3
+ {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ }
10
+ ],
11
  "bos_token": {
12
  "content": "<s>",
13
  "lstrip": false,
 
22
  "rstrip": false,
23
  "single_word": false
24
  },
25
+ "pad_token": "[PAD]",
26
  "unk_token": {
27
  "content": "<unk>",
28
  "lstrip": false,
tokenizer_config.json CHANGED
@@ -32850,8 +32850,19 @@
32850
  "rstrip": false,
32851
  "single_word": false,
32852
  "special": false
 
 
 
 
 
 
 
 
32853
  }
32854
  },
 
 
 
32855
  "bos_token": "<s>",
32856
  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}\n{% for message in loop_messages %}\n{% if message['role'] not in ['user', 'assistant', 'tool_calls'] %}\n{{ raise_exception('Invalid role: ' + message['role'] + '. Must be user, assistant, or tool_calls.') }}\n{% endif %}\n{% if loop.index0 == 0 and system_message != false %}\n{% set content = '<<SYS>>\n' + system_message + '\n<</SYS>>\n\n' + message['content'] %}\n{% else %}\n{% set content = message['content'] %}\n{% endif %}\n{% if message['role'] == 'user' %}\n{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}\n{% elif message['role'] == 'assistant' %}\n{{ ' ' + content.strip() + ' ' + eos_token }}\n{% elif message['role'] == 'tool_calls' %}\n{{ ' [TOOL_CALLS] ' + content.strip() + ' [/TOOL_CALLS] ' }}\n{% endif %}\n{% endfor %}",
32857
  "clean_up_tokenization_spaces": false,
@@ -32859,7 +32870,7 @@
32859
  "extra_special_tokens": {},
32860
  "legacy": false,
32861
  "model_max_length": 8192,
32862
- "pad_token": "<unk>",
32863
  "padding_side": "right",
32864
  "sp_model_kwargs": {},
32865
  "spaces_between_special_tokens": false,
 
32850
  "rstrip": false,
32851
  "single_word": false,
32852
  "special": false
32853
+ },
32854
+ "68096": {
32855
+ "content": "[PAD]",
32856
+ "lstrip": false,
32857
+ "normalized": false,
32858
+ "rstrip": false,
32859
+ "single_word": false,
32860
+ "special": true
32861
  }
32862
  },
32863
+ "additional_special_tokens": [
32864
+ "[PAD]"
32865
+ ],
32866
  "bos_token": "<s>",
32867
  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}\n{% for message in loop_messages %}\n{% if message['role'] not in ['user', 'assistant', 'tool_calls'] %}\n{{ raise_exception('Invalid role: ' + message['role'] + '. Must be user, assistant, or tool_calls.') }}\n{% endif %}\n{% if loop.index0 == 0 and system_message != false %}\n{% set content = '<<SYS>>\n' + system_message + '\n<</SYS>>\n\n' + message['content'] %}\n{% else %}\n{% set content = message['content'] %}\n{% endif %}\n{% if message['role'] == 'user' %}\n{{ bos_token + '[INST] ' + content.strip() + ' [/INST]' }}\n{% elif message['role'] == 'assistant' %}\n{{ ' ' + content.strip() + ' ' + eos_token }}\n{% elif message['role'] == 'tool_calls' %}\n{{ ' [TOOL_CALLS] ' + content.strip() + ' [/TOOL_CALLS] ' }}\n{% endif %}\n{% endfor %}",
32868
  "clean_up_tokenization_spaces": false,
 
32870
  "extra_special_tokens": {},
32871
  "legacy": false,
32872
  "model_max_length": 8192,
32873
+ "pad_token": "[PAD]",
32874
  "padding_side": "right",
32875
  "sp_model_kwargs": {},
32876
  "spaces_between_special_tokens": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca331fe95720e05f38064944932d8543f0c9ce884d869794497e5236b3d18763
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba593b17db62769f48cad2733568a19f9d173e99ae9d8956ed8b3f4f7f9c8598
3
  size 5496