anikifoss committed on
Commit
38c2ba8
·
verified ·
1 Parent(s): c17ddd0

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +13 -13
README.md CHANGED
@@ -67,7 +67,7 @@ custom="
67
  blk\.0\.ffn_down\.weight=q8_0
68
  blk\.0\.ffn_gate\.weight=q8_0
69
  blk\.0\.ffn_up\.weight=q8_0
70
- blk\.46\.nextn\.eh_proj\.weight=f16
71
  blk\.46\.nextn\.embed_tokens\.weight=q8_0
72
  blk\.46\.nextn\.enorm\.weight=f32
73
  blk\.46\.nextn\.hnorm\.weight=f32
@@ -104,32 +104,32 @@ blk\.4[0-6]\.post_attention_norm\.weight=f32
104
 
105
  blk\.[1-9]\.exp_probs_b\.bias=f32
106
  blk\.[1-9]\.ffn_down_exps\.weight=q8_0
107
- blk\.[1-9]\.ffn_down_shexp\.weight=f16
108
  blk\.[1-9]\.ffn_gate_exps\.weight=q4_K
109
  blk\.[1-9]\.ffn_gate_inp\.weight=f32
110
- blk\.[1-9]\.ffn_gate_shexp\.weight=f16
111
  blk\.[1-9]\.ffn_up_exps\.weight=q4_K
112
- blk\.[1-9]\.ffn_up_shexp\.weight=f16
113
  blk\.[1-3][0-9]\.exp_probs_b\.bias=f32
114
  blk\.[1-3][0-9]\.ffn_down_exps\.weight=q8_0
115
- blk\.[1-3][0-9]\.ffn_down_shexp\.weight=f16
116
  blk\.[1-3][0-9]\.ffn_gate_exps\.weight=q4_K
117
  blk\.[1-3][0-9]\.ffn_gate_inp\.weight=f32
118
- blk\.[1-3][0-9]\.ffn_gate_shexp\.weight=f16
119
  blk\.[1-3][0-9]\.ffn_up_exps\.weight=q4_K
120
- blk\.[1-3][0-9]\.ffn_up_shexp\.weight=f16
121
  blk\.4[0-6]\.exp_probs_b\.bias=f32
122
  blk\.4[0-6]\.ffn_down_exps\.weight=q8_0
123
- blk\.4[0-6]\.ffn_down_shexp\.weight=f16
124
  blk\.4[0-6]\.ffn_gate_exps\.weight=q4_K
125
  blk\.4[0-6]\.ffn_gate_inp\.weight=f32
126
- blk\.4[0-6]\.ffn_gate_shexp\.weight=f16
127
  blk\.4[0-6]\.ffn_up_exps\.weight=q4_K
128
- blk\.4[0-6]\.ffn_up_shexp\.weight=f16
129
 
130
- output\.weight=f16
131
  output_norm\.weight=f32
132
- token_embd\.weight=f16
133
  "
134
 
135
  custom=$(
@@ -143,7 +143,7 @@ TARGET_MODEL="GLM-4.5-Air-HQ4_K"
143
  mkdir -p ~/Env/models/anikifoss/$TARGET_MODEL
144
  ./build/bin/llama-quantize \
145
  --custom-q "$custom" \
146
- /mnt/data/Models/zai-org/GLM-4.5-Air-GGUF/GLM-4.5-Air-128x9.4B-F16-00001-of-00005.gguf \
147
  ~/Env/models/anikifoss/$TARGET_MODEL/$TARGET_MODEL.gguf \
148
  Q4_K \
149
  32
 
67
  blk\.0\.ffn_down\.weight=q8_0
68
  blk\.0\.ffn_gate\.weight=q8_0
69
  blk\.0\.ffn_up\.weight=q8_0
70
+ blk\.46\.nextn\.eh_proj\.weight=bf16
71
  blk\.46\.nextn\.embed_tokens\.weight=q8_0
72
  blk\.46\.nextn\.enorm\.weight=f32
73
  blk\.46\.nextn\.hnorm\.weight=f32
 
104
 
105
  blk\.[1-9]\.exp_probs_b\.bias=f32
106
  blk\.[1-9]\.ffn_down_exps\.weight=q8_0
107
+ blk\.[1-9]\.ffn_down_shexp\.weight=bf16
108
  blk\.[1-9]\.ffn_gate_exps\.weight=q4_K
109
  blk\.[1-9]\.ffn_gate_inp\.weight=f32
110
+ blk\.[1-9]\.ffn_gate_shexp\.weight=bf16
111
  blk\.[1-9]\.ffn_up_exps\.weight=q4_K
112
+ blk\.[1-9]\.ffn_up_shexp\.weight=bf16
113
  blk\.[1-3][0-9]\.exp_probs_b\.bias=f32
114
  blk\.[1-3][0-9]\.ffn_down_exps\.weight=q8_0
115
+ blk\.[1-3][0-9]\.ffn_down_shexp\.weight=bf16
116
  blk\.[1-3][0-9]\.ffn_gate_exps\.weight=q4_K
117
  blk\.[1-3][0-9]\.ffn_gate_inp\.weight=f32
118
+ blk\.[1-3][0-9]\.ffn_gate_shexp\.weight=bf16
119
  blk\.[1-3][0-9]\.ffn_up_exps\.weight=q4_K
120
+ blk\.[1-3][0-9]\.ffn_up_shexp\.weight=bf16
121
  blk\.4[0-6]\.exp_probs_b\.bias=f32
122
  blk\.4[0-6]\.ffn_down_exps\.weight=q8_0
123
+ blk\.4[0-6]\.ffn_down_shexp\.weight=bf16
124
  blk\.4[0-6]\.ffn_gate_exps\.weight=q4_K
125
  blk\.4[0-6]\.ffn_gate_inp\.weight=f32
126
+ blk\.4[0-6]\.ffn_gate_shexp\.weight=bf16
127
  blk\.4[0-6]\.ffn_up_exps\.weight=q4_K
128
+ blk\.4[0-6]\.ffn_up_shexp\.weight=bf16
129
 
130
+ output\.weight=bf16
131
  output_norm\.weight=f32
132
+ token_embd\.weight=bf16
133
  "
134
 
135
  custom=$(
 
143
  mkdir -p ~/Env/models/anikifoss/$TARGET_MODEL
144
  ./build/bin/llama-quantize \
145
  --custom-q "$custom" \
146
+ /mnt/data/Models/zai-org/GLM-4.5-Air-GGUF/GLM-4.5-Air-128x9.4B-BF16-00001-of-00005.gguf \
147
  ~/Env/models/anikifoss/$TARGET_MODEL/$TARGET_MODEL.gguf \
148
  Q4_K \
149
  32