Upload MllamaForConditionalGeneration
Browse files
- config.json +12 -38
- model-00001-of-00002.safetensors +2 -2
- model-00002-of-00002.safetensors +2 -2
- model.safetensors.index.json +0 -0
config.json
CHANGED
|
@@ -19,44 +19,18 @@
|
|
| 19 |
"multi_modal_projector",
|
| 20 |
"merger",
|
| 21 |
"modality_projection",
|
| 22 |
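-
"vision_model.transformer.layers.0.mlp",
|
| 23 |
-
"vision_model.transformer.layers.1.mlp",
|
| 24 |
-
"vision_model.transformer.layers.2.mlp",
|
| 25 |
-
"vision_model.transformer.layers.3.mlp",
|
| 26 |
-
"vision_model.transformer.layers.4.mlp",
|
| 27 |
-
"vision_model.transformer.layers.5.mlp",
|
| 28 |
-
"vision_model.transformer.layers.6.mlp",
|
| 29 |
-
"vision_model.transformer.layers.7.mlp",
|
| 30 |
-
"vision_model.transformer.layers.8.mlp",
|
| 31 |
-
"vision_model.transformer.layers.9.mlp",
|
| 32 |
-
"vision_model.transformer.layers.10.mlp",
|
| 33 |
-
"vision_model.transformer.layers.11.mlp",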
|
| 34 |
-
"vision_model.transformer.layers.12.mlp",
|
| 35 |
-
"vision_model.transformer.layers.13.mlp",
|
| 36 |
-
"vision_model.transformer.layers.14.mlp",
|
| 37 |
-
"vision_model.transformer.layers.15.mlp",
|
| 38 |
-
"vision_model.transformer.layers.16.mlp",
|
| 39 |
-
"vision_model.transformer.layers.17.mlp",
|
| 40 |
-
"vision_model.transformer.layers.18.mlp",
|
| 41 |
-
"vision_model.transformer.layers.19.mlp",
|
| 42 |
-
"vision_model.transformer.layers.20.mlp",
|
| 43 |
-
"vision_model.transformer.layers.21.mlp",
|
| 44 |
-
"vision_model.transformer.layers.22.mlp",
|
| 45 |
-
"vision_model.transformer.layers.23.mlp",
|
| 46 |
-
"vision_model.transformer.layers.24.mlp",
|
| 47 |
-
"vision_model.transformer.layers.25.mlp",
|
| 48 |
-
"vision_model.transformer.layers.26.mlp",
|
| 49 |
-
"vision_model.transformer.layers.27.mlp",
|
| 50 |
-
"vision_model.transformer.layers.28.mlp",
|
| 51 |
-
"vision_model.transformer.layers.29.mlp",
|
| 52 |
-
"vision_model.transformer.layers.30.mlp",
|
| 53 |
-
"vision_model.transformer.layers.31.mlp",
|
| 54 |
-
"vision_model.global_transformer.layers.0.mlp",
|
| 55 |
-
"vision_model.global_transformer.layers.1.mlp",
|
| 56 |
-
"vision_model.global_transformer.layers.2.mlp",
|
| 57 |
-
"vision_model.global_transformer.layers.3.mlp",
|
| 58 |
-
"vision_model.global_transformer.layers.4.mlp",
|
| 59 |
-
"vision_model.global_transformer.layers.5.mlp"
|
| 60 |
],
|
| 61 |
"llm_int8_threshold": 6.0,
|
| 62 |
"load_in_4bit": true,
|
|
|
|
| 19 |
"multi_modal_projector",
|
| 20 |
"merger",
|
| 21 |
"modality_projection",
|
| 22 |
+
"language_model.model.layers.1.self_attn",
|
| 23 |
+
"language_model.model.layers.1.mlp",
|
| 24 |
+
"vision_model.transformer.layers.13.mlp.fc2",
|
| 25 |
+
"language_model.model.layers.8.cross_attn.o_proj",
|
| 26 |
+
"language_model.model.layers.13.cross_attn.o_proj",
|
| 27 |
+
"language_model.model.layers.13.mlp.down_proj",
|
| 28 |
+
"language_model.model.layers.18.cross_attn.o_proj",
|
| 29 |
+
"language_model.model.layers.18.mlp.down_proj",
|
| 30 |
+
"language_model.model.layers.23.cross_attn.o_proj",
|
| 31 |
+
"language_model.model.layers.28.cross_attn.o_proj",
|
| 32 |
+
"language_model.model.layers.33.cross_attn.o_proj",
|
| 33 |
+
"language_model.model.layers.38.cross_attn.o_proj"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
],
|
| 35 |
"llm_int8_threshold": 6.0,
|
| 36 |
"load_in_4bit": true,
|
model-00001-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:afad208b9b805474e7f5d8de82043cf970f6e799c0b655cd6c6e522b9371e618
|
| 3 |
+
size 4971535505
|
model-00002-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc63401a455ef422970874eabac70ebf6380eb565c592341c4932092f569f720
|
| 3 |
+
size 2937067316
|
model.safetensors.index.json
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|