Update README.md
Browse files
README.md
CHANGED
|
@@ -67,7 +67,7 @@ custom="
|
|
| 67 |
blk\.0\.ffn_down\.weight=q8_0
|
| 68 |
blk\.0\.ffn_gate\.weight=q8_0
|
| 69 |
blk\.0\.ffn_up\.weight=q8_0
|
| 70 |
-
blk\.46\.nextn\.eh_proj\.weight=
|
| 71 |
blk\.46\.nextn\.embed_tokens\.weight=q8_0
|
| 72 |
blk\.46\.nextn\.enorm\.weight=f32
|
| 73 |
blk\.46\.nextn\.hnorm\.weight=f32
|
|
@@ -104,32 +104,32 @@ blk\.4[0-6]\.post_attention_norm\.weight=f32
|
|
| 104 |
|
| 105 |
blk\.[1-9]\.exp_probs_b\.bias=f32
|
| 106 |
blk\.[1-9]\.ffn_down_exps\.weight=q8_0
|
| 107 |
-
blk\.[1-9]\.ffn_down_shexp\.weight=
|
| 108 |
blk\.[1-9]\.ffn_gate_exps\.weight=q4_K
|
| 109 |
blk\.[1-9]\.ffn_gate_inp\.weight=f32
|
| 110 |
-
blk\.[1-9]\.ffn_gate_shexp\.weight=
|
| 111 |
blk\.[1-9]\.ffn_up_exps\.weight=q4_K
|
| 112 |
-
blk\.[1-9]\.ffn_up_shexp\.weight=
|
| 113 |
blk\.[1-3][0-9]\.exp_probs_b\.bias=f32
|
| 114 |
blk\.[1-3][0-9]\.ffn_down_exps\.weight=q8_0
|
| 115 |
-
blk\.[1-3][0-9]\.ffn_down_shexp\.weight=
|
| 116 |
blk\.[1-3][0-9]\.ffn_gate_exps\.weight=q4_K
|
| 117 |
blk\.[1-3][0-9]\.ffn_gate_inp\.weight=f32
|
| 118 |
-
blk\.[1-3][0-9]\.ffn_gate_shexp\.weight=
|
| 119 |
blk\.[1-3][0-9]\.ffn_up_exps\.weight=q4_K
|
| 120 |
-
blk\.[1-3][0-9]\.ffn_up_shexp\.weight=
|
| 121 |
blk\.4[0-6]\.exp_probs_b\.bias=f32
|
| 122 |
blk\.4[0-6]\.ffn_down_exps\.weight=q8_0
|
| 123 |
-
blk\.4[0-6]\.ffn_down_shexp\.weight=
|
| 124 |
blk\.4[0-6]\.ffn_gate_exps\.weight=q4_K
|
| 125 |
blk\.4[0-6]\.ffn_gate_inp\.weight=f32
|
| 126 |
-
blk\.4[0-6]\.ffn_gate_shexp\.weight=
|
| 127 |
blk\.4[0-6]\.ffn_up_exps\.weight=q4_K
|
| 128 |
-
blk\.4[0-6]\.ffn_up_shexp\.weight=
|
| 129 |
|
| 130 |
-
output\.weight=
|
| 131 |
output_norm\.weight=f32
|
| 132 |
-
token_embd\.weight=
|
| 133 |
"
|
| 134 |
|
| 135 |
custom=$(
|
|
@@ -143,7 +143,7 @@ TARGET_MODEL="GLM-4.5-Air-HQ4_K"
|
|
| 143 |
mkdir -p ~/Env/models/anikifoss/$TARGET_MODEL
|
| 144 |
./build/bin/llama-quantize \
|
| 145 |
--custom-q "$custom" \
|
| 146 |
-
/mnt/data/Models/zai-org/GLM-4.5-Air-GGUF/GLM-4.5-Air-128x9.4B-
|
| 147 |
~/Env/models/anikifoss/$TARGET_MODEL/$TARGET_MODEL.gguf \
|
| 148 |
Q4_K \
|
| 149 |
32
|
|
|
|
| 67 |
blk\.0\.ffn_down\.weight=q8_0
|
| 68 |
blk\.0\.ffn_gate\.weight=q8_0
|
| 69 |
blk\.0\.ffn_up\.weight=q8_0
|
| 70 |
+
blk\.46\.nextn\.eh_proj\.weight=bf16
|
| 71 |
blk\.46\.nextn\.embed_tokens\.weight=q8_0
|
| 72 |
blk\.46\.nextn\.enorm\.weight=f32
|
| 73 |
blk\.46\.nextn\.hnorm\.weight=f32
|
|
|
|
| 104 |
|
| 105 |
blk\.[1-9]\.exp_probs_b\.bias=f32
|
| 106 |
blk\.[1-9]\.ffn_down_exps\.weight=q8_0
|
| 107 |
+
blk\.[1-9]\.ffn_down_shexp\.weight=bf16
|
| 108 |
blk\.[1-9]\.ffn_gate_exps\.weight=q4_K
|
| 109 |
blk\.[1-9]\.ffn_gate_inp\.weight=f32
|
| 110 |
+
blk\.[1-9]\.ffn_gate_shexp\.weight=bf16
|
| 111 |
blk\.[1-9]\.ffn_up_exps\.weight=q4_K
|
| 112 |
+
blk\.[1-9]\.ffn_up_shexp\.weight=bf16
|
| 113 |
blk\.[1-3][0-9]\.exp_probs_b\.bias=f32
|
| 114 |
blk\.[1-3][0-9]\.ffn_down_exps\.weight=q8_0
|
| 115 |
+
blk\.[1-3][0-9]\.ffn_down_shexp\.weight=bf16
|
| 116 |
blk\.[1-3][0-9]\.ffn_gate_exps\.weight=q4_K
|
| 117 |
blk\.[1-3][0-9]\.ffn_gate_inp\.weight=f32
|
| 118 |
+
blk\.[1-3][0-9]\.ffn_gate_shexp\.weight=bf16
|
| 119 |
blk\.[1-3][0-9]\.ffn_up_exps\.weight=q4_K
|
| 120 |
+
blk\.[1-3][0-9]\.ffn_up_shexp\.weight=bf16
|
| 121 |
blk\.4[0-6]\.exp_probs_b\.bias=f32
|
| 122 |
blk\.4[0-6]\.ffn_down_exps\.weight=q8_0
|
| 123 |
+
blk\.4[0-6]\.ffn_down_shexp\.weight=bf16
|
| 124 |
blk\.4[0-6]\.ffn_gate_exps\.weight=q4_K
|
| 125 |
blk\.4[0-6]\.ffn_gate_inp\.weight=f32
|
| 126 |
+
blk\.4[0-6]\.ffn_gate_shexp\.weight=bf16
|
| 127 |
blk\.4[0-6]\.ffn_up_exps\.weight=q4_K
|
| 128 |
+
blk\.4[0-6]\.ffn_up_shexp\.weight=bf16
|
| 129 |
|
| 130 |
+
output\.weight=bf16
|
| 131 |
output_norm\.weight=f32
|
| 132 |
+
token_embd\.weight=bf16
|
| 133 |
"
|
| 134 |
|
| 135 |
custom=$(
|
|
|
|
| 143 |
mkdir -p ~/Env/models/anikifoss/$TARGET_MODEL
|
| 144 |
./build/bin/llama-quantize \
|
| 145 |
--custom-q "$custom" \
|
| 146 |
+
/mnt/data/Models/zai-org/GLM-4.5-Air-GGUF/GLM-4.5-Air-128x9.4B-BF16-00001-of-00005.gguf \
|
| 147 |
~/Env/models/anikifoss/$TARGET_MODEL/$TARGET_MODEL.gguf \
|
| 148 |
Q4_K \
|
| 149 |
32
|