mrcuddle committed on
Commit
5336849
1 Parent(s): 6654a62

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. config.json +8 -25
  2. special_tokens_map.json +0 -7
  3. tokenizer.json +19 -85
  4. tokenizer_config.json +13 -21
config.json CHANGED
@@ -1,32 +1,13 @@
1
  {
2
  "_commit_hash": null,
3
- "_name_or_path": "mistralai/Pixtral-12B",
4
  "architectures": [
5
  "LlavaForConditionalGeneration"
6
  ],
7
- "attention_dropout": 0.0,
8
- "bos_token_id": 1,
9
- "eos_token_id": 2,
10
- "head_dim": 128,
11
- "hidden_act": "silu",
12
- "hidden_size": 5120,
13
- "initializer_range": 0.02,
14
- "intermediate_size": 14336,
15
- "max_position_embeddings": 1024000,
16
- "model_type": "mistral",
17
- "num_attention_heads": 32,
18
- "num_hidden_layers": 40,
19
- "num_key_value_heads": 8,
20
- "rms_norm_eps": 1e-05,
21
- "rope_theta": 1000000.0,
22
- "sliding_window": null,
23
- "tie_word_embeddings": false,
24
- "torch_dtype": "bfloat16",
25
- "transformers_version": "4.44.0.dev0",
26
- "use_cache": false,
27
- "vocab_size": 131073,
28
  "image_seq_length": 1,
29
  "image_token_index": 10,
 
30
  "projector_hidden_act": "gelu",
31
  "text_config": {
32
  "hidden_size": 5120,
@@ -34,7 +15,7 @@
34
  "intermediate_size": 14336,
35
  "is_composition": true,
36
  "max_position_embeddings": 1024000,
37
- "model_type": "llava",
38
  "num_hidden_layers": 40,
39
  "num_key_value_heads": 8,
40
  "rms_norm_eps": 1e-05,
@@ -42,16 +23,18 @@
42
  "sliding_window": null,
43
  "vocab_size": 131072
44
  },
 
 
45
  "vision_config": {
46
  "head_dim": 64,
47
  "hidden_act": "silu",
48
  "image_size": 1024,
49
  "is_composition": true,
50
- "model_type": "llava",
51
  "patch_size": 16,
52
  "rope_theta": 10000.0,
53
  "tie_word_embeddings": false
54
  },
55
  "vision_feature_layer": -1,
56
  "vision_feature_select_strategy": "full"
57
- }
 
1
  {
2
  "_commit_hash": null,
3
+ "_name_or_path": "../pixtral",
4
  "architectures": [
5
  "LlavaForConditionalGeneration"
6
  ],
7
+ "ignore_index": -100,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
  "image_seq_length": 1,
9
  "image_token_index": 10,
10
+ "model_type": "llava",
11
  "projector_hidden_act": "gelu",
12
  "text_config": {
13
  "hidden_size": 5120,
 
15
  "intermediate_size": 14336,
16
  "is_composition": true,
17
  "max_position_embeddings": 1024000,
18
+ "model_type": "mistral",
19
  "num_hidden_layers": 40,
20
  "num_key_value_heads": 8,
21
  "rms_norm_eps": 1e-05,
 
23
  "sliding_window": null,
24
  "vocab_size": 131072
25
  },
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": null,
28
  "vision_config": {
29
  "head_dim": 64,
30
  "hidden_act": "silu",
31
  "image_size": 1024,
32
  "is_composition": true,
33
+ "model_type": "pixtral",
34
  "patch_size": 16,
35
  "rope_theta": 10000.0,
36
  "tie_word_embeddings": false
37
  },
38
  "vision_feature_layer": -1,
39
  "vision_feature_select_strategy": "full"
40
+ }
special_tokens_map.json CHANGED
@@ -13,13 +13,6 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
  "unk_token": {
24
  "content": "<unk>",
25
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
 
 
 
 
 
 
 
16
  "unk_token": {
17
  "content": "<unk>",
18
  "lstrip": false,
tokenizer.json CHANGED
@@ -95,7 +95,7 @@
95
  },
96
  {
97
  "id": 10,
98
- "content": "<pad>",
99
  "single_word": false,
100
  "lstrip": false,
101
  "rstrip": false,
@@ -104,7 +104,7 @@
104
  },
105
  {
106
  "id": 11,
107
- "content": "[PREFIX]",
108
  "single_word": false,
109
  "lstrip": false,
110
  "rstrip": false,
@@ -113,7 +113,7 @@
113
  },
114
  {
115
  "id": 12,
116
- "content": "[MIDDLE]",
117
  "single_word": false,
118
  "lstrip": false,
119
  "rstrip": false,
@@ -122,7 +122,7 @@
122
  },
123
  {
124
  "id": 13,
125
- "content": "[SUFFIX]",
126
  "single_word": false,
127
  "lstrip": false,
128
  "rstrip": false,
@@ -131,7 +131,7 @@
131
  },
132
  {
133
  "id": 14,
134
- "content": "<SPECIAL_14>",
135
  "single_word": false,
136
  "lstrip": false,
137
  "rstrip": false,
@@ -140,7 +140,7 @@
140
  },
141
  {
142
  "id": 15,
143
- "content": "<SPECIAL_15>",
144
  "single_word": false,
145
  "lstrip": false,
146
  "rstrip": false,
@@ -149,7 +149,7 @@
149
  },
150
  {
151
  "id": 16,
152
- "content": "<SPECIAL_16>",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
@@ -9002,15 +9002,6 @@
9002
  "rstrip": false,
9003
  "normalized": false,
9004
  "special": true
9005
- },
9006
- {
9007
- "id": 131072,
9008
- "content": "[PAD]",
9009
- "single_word": false,
9010
- "lstrip": false,
9011
- "rstrip": false,
9012
- "normalized": false,
9013
- "special": true
9014
  }
9015
  ],
9016
  "normalizer": null,
@@ -9020,7 +9011,7 @@
9020
  {
9021
  "type": "Split",
9022
  "pattern": {
9023
- "Regex": "[^\\r\\n\\p{L}\\p{N}]?[\\p{Lu}\\p{Lt}\\p{Lm}\\p{Lo}\\p{M}]*[\\p{Ll}\\p{Lm}\\p{Lo}\\p{M}]+|[^\\r\\n\\p{L}\\p{N}]?[\\p{Lu}\\p{Lt}\\p{Lm}\\p{Lo}\\p{M}]+[\\p{Ll}\\p{Lm}\\p{Lo}\\p{M}]*|\\p{N}| ?[^\\s\\p{L}\\p{N}]+[\\r\\n/]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+"
9024
  },
9025
  "behavior": "Isolated",
9026
  "invert": false
@@ -9034,67 +9025,10 @@
9034
  ]
9035
  },
9036
  "post_processor": {
9037
- "type": "TemplateProcessing",
9038
- "single": [
9039
- {
9040
- "SpecialToken": {
9041
- "id": "<s>",
9042
- "type_id": 0
9043
- }
9044
- },
9045
- {
9046
- "Sequence": {
9047
- "id": "A",
9048
- "type_id": 0
9049
- }
9050
- }
9051
- ],
9052
- "pair": [
9053
- {
9054
- "SpecialToken": {
9055
- "id": "<s>",
9056
- "type_id": 0
9057
- }
9058
- },
9059
- {
9060
- "Sequence": {
9061
- "id": "A",
9062
- "type_id": 0
9063
- }
9064
- },
9065
- {
9066
- "SpecialToken": {
9067
- "id": "<s>",
9068
- "type_id": 1
9069
- }
9070
- },
9071
- {
9072
- "Sequence": {
9073
- "id": "B",
9074
- "type_id": 1
9075
- }
9076
- }
9077
- ],
9078
- "special_tokens": {
9079
- "</s>": {
9080
- "id": "</s>",
9081
- "ids": [
9082
- 2
9083
- ],
9084
- "tokens": [
9085
- "</s>"
9086
- ]
9087
- },
9088
- "<s>": {
9089
- "id": "<s>",
9090
- "ids": [
9091
- 1
9092
- ],
9093
- "tokens": [
9094
- "<s>"
9095
- ]
9096
- }
9097
- }
9098
  },
9099
  "decoder": {
9100
  "type": "ByteLevel",
@@ -9122,13 +9056,13 @@
9122
  "[TOOL_RESULTS]": 7,
9123
  "[/TOOL_RESULTS]": 8,
9124
  "[TOOL_CALLS]": 9,
9125
- "<pad>": 10,
9126
- "[PREFIX]": 11,
9127
- "[MIDDLE]": 12,
9128
- "[SUFFIX]": 13,
9129
- "<SPECIAL_14>": 14,
9130
- "<SPECIAL_15>": 15,
9131
- "<SPECIAL_16>": 16,
9132
  "<SPECIAL_17>": 17,
9133
  "<SPECIAL_18>": 18,
9134
  "<SPECIAL_19>": 19,
 
95
  },
96
  {
97
  "id": 10,
98
+ "content": "[IMG]",
99
  "single_word": false,
100
  "lstrip": false,
101
  "rstrip": false,
 
104
  },
105
  {
106
  "id": 11,
107
+ "content": "<pad>",
108
  "single_word": false,
109
  "lstrip": false,
110
  "rstrip": false,
 
113
  },
114
  {
115
  "id": 12,
116
+ "content": "[IMG_BREAK]",
117
  "single_word": false,
118
  "lstrip": false,
119
  "rstrip": false,
 
122
  },
123
  {
124
  "id": 13,
125
+ "content": "[IMG_END]",
126
  "single_word": false,
127
  "lstrip": false,
128
  "rstrip": false,
 
131
  },
132
  {
133
  "id": 14,
134
+ "content": "[PREFIX]",
135
  "single_word": false,
136
  "lstrip": false,
137
  "rstrip": false,
 
140
  },
141
  {
142
  "id": 15,
143
+ "content": "[MIDDLE]",
144
  "single_word": false,
145
  "lstrip": false,
146
  "rstrip": false,
 
149
  },
150
  {
151
  "id": 16,
152
+ "content": "[SUFFIX]",
153
  "single_word": false,
154
  "lstrip": false,
155
  "rstrip": false,
 
9002
  "rstrip": false,
9003
  "normalized": false,
9004
  "special": true
 
 
 
 
 
 
 
 
 
9005
  }
9006
  ],
9007
  "normalizer": null,
 
9011
  {
9012
  "type": "Split",
9013
  "pattern": {
9014
+ "Regex": "(?i:'s|'t|'re|'ve|'m|'ll|'d)|[^\\r\\n\\p{L}\\p{N}]?\\p{L}+|\\p{N}{1,3}| ?[^\\s\\p{L}\\p{N}]+[\\r\\n]*|\\s*[\\r\\n]+|\\s+(?!\\S)|\\s+"
9015
  },
9016
  "behavior": "Isolated",
9017
  "invert": false
 
9025
  ]
9026
  },
9027
  "post_processor": {
9028
+ "type": "ByteLevel",
9029
+ "add_prefix_space": true,
9030
+ "trim_offsets": false,
9031
+ "use_regex": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9032
  },
9033
  "decoder": {
9034
  "type": "ByteLevel",
 
9056
  "[TOOL_RESULTS]": 7,
9057
  "[/TOOL_RESULTS]": 8,
9058
  "[TOOL_CALLS]": 9,
9059
+ "[IMG]": 10,
9060
+ "<pad>": 11,
9061
+ "[IMG_BREAK]": 12,
9062
+ "[IMG_END]": 13,
9063
+ "[PREFIX]": 14,
9064
+ "[MIDDLE]": 15,
9065
+ "[SUFFIX]": 16,
9066
  "<SPECIAL_17>": 17,
9067
  "<SPECIAL_18>": 18,
9068
  "<SPECIAL_19>": 19,
tokenizer_config.json CHANGED
@@ -1,7 +1,4 @@
1
  {
2
- "add_bos_token": true,
3
- "add_eos_token": false,
4
- "add_prefix_space": false,
5
  "added_tokens_decoder": {
6
  "0": {
7
  "content": "<unk>",
@@ -84,7 +81,7 @@
84
  "special": true
85
  },
86
  "10": {
87
- "content": "<pad>",
88
  "lstrip": false,
89
  "normalized": false,
90
  "rstrip": false,
@@ -92,7 +89,7 @@
92
  "special": true
93
  },
94
  "11": {
95
- "content": "[PREFIX]",
96
  "lstrip": false,
97
  "normalized": false,
98
  "rstrip": false,
@@ -100,7 +97,7 @@
100
  "special": true
101
  },
102
  "12": {
103
- "content": "[MIDDLE]",
104
  "lstrip": false,
105
  "normalized": false,
106
  "rstrip": false,
@@ -108,7 +105,7 @@
108
  "special": true
109
  },
110
  "13": {
111
- "content": "[SUFFIX]",
112
  "lstrip": false,
113
  "normalized": false,
114
  "rstrip": false,
@@ -116,7 +113,7 @@
116
  "special": true
117
  },
118
  "14": {
119
- "content": "<SPECIAL_14>",
120
  "lstrip": false,
121
  "normalized": false,
122
  "rstrip": false,
@@ -124,7 +121,7 @@
124
  "special": true
125
  },
126
  "15": {
127
- "content": "<SPECIAL_15>",
128
  "lstrip": false,
129
  "normalized": false,
130
  "rstrip": false,
@@ -132,7 +129,7 @@
132
  "special": true
133
  },
134
  "16": {
135
- "content": "<SPECIAL_16>",
136
  "lstrip": false,
137
  "normalized": false,
138
  "rstrip": false,
@@ -8002,22 +7999,17 @@
8002
  "rstrip": false,
8003
  "single_word": false,
8004
  "special": true
8005
- },
8006
- "131072": {
8007
- "content": "[PAD]",
8008
- "lstrip": false,
8009
- "normalized": false,
8010
- "rstrip": false,
8011
- "single_word": false,
8012
- "special": true
8013
  }
8014
  },
8015
  "bos_token": "<s>",
8016
- "chat_template": "{{ bos_token }}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ '[INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
8017
- "clean_up_tokenization_spaces": false,
8018
  "eos_token": "</s>",
 
 
 
 
8019
  "model_max_length": 1000000000000000019884624838656,
8020
- "pad_token": "[PAD]",
8021
  "tokenizer_class": "PreTrainedTokenizerFast",
8022
  "unk_token": "<unk>"
8023
  }
 
1
  {
 
 
 
2
  "added_tokens_decoder": {
3
  "0": {
4
  "content": "<unk>",
 
81
  "special": true
82
  },
83
  "10": {
84
+ "content": "[IMG]",
85
  "lstrip": false,
86
  "normalized": false,
87
  "rstrip": false,
 
89
  "special": true
90
  },
91
  "11": {
92
+ "content": "<pad>",
93
  "lstrip": false,
94
  "normalized": false,
95
  "rstrip": false,
 
97
  "special": true
98
  },
99
  "12": {
100
+ "content": "[IMG_BREAK]",
101
  "lstrip": false,
102
  "normalized": false,
103
  "rstrip": false,
 
105
  "special": true
106
  },
107
  "13": {
108
+ "content": "[IMG_END]",
109
  "lstrip": false,
110
  "normalized": false,
111
  "rstrip": false,
 
113
  "special": true
114
  },
115
  "14": {
116
+ "content": "[PREFIX]",
117
  "lstrip": false,
118
  "normalized": false,
119
  "rstrip": false,
 
121
  "special": true
122
  },
123
  "15": {
124
+ "content": "[MIDDLE]",
125
  "lstrip": false,
126
  "normalized": false,
127
  "rstrip": false,
 
129
  "special": true
130
  },
131
  "16": {
132
+ "content": "[SUFFIX]",
133
  "lstrip": false,
134
  "normalized": false,
135
  "rstrip": false,
 
7999
  "rstrip": false,
8000
  "single_word": false,
8001
  "special": true
 
 
 
 
 
 
 
 
8002
  }
8003
  },
8004
  "bos_token": "<s>",
8005
+ "clean_up_tokenization_spaces": true,
 
8006
  "eos_token": "</s>",
8007
+ "model_input_names": [
8008
+ "input_ids",
8009
+ "attention_mask"
8010
+ ],
8011
  "model_max_length": 1000000000000000019884624838656,
8012
+ "processor_class": "PixtralProcessor",
8013
  "tokenizer_class": "PreTrainedTokenizerFast",
8014
  "unk_token": "<unk>"
8015
  }