OPEA
/

Safetensors
qwen2
4-bit precision
auto-round
cicdatopea committed on
Commit
721052a
·
verified ·
1 Parent(s): 57170f1

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +1 -68
config.json CHANGED
@@ -51,74 +51,7 @@
51
  "scale_dtype": "torch.float16",
52
  "seqlen": 2048,
53
  "sym": true,
54
- "to_quant_block_names": [
55
- [
56
- "model.layers.0",
57
- "model.layers.1",
58
- "model.layers.2",
59
- "model.layers.3",
60
- "model.layers.4",
61
- "model.layers.5",
62
- "model.layers.6",
63
- "model.layers.7",
64
- "model.layers.8",
65
- "model.layers.9",
66
- "model.layers.10",
67
- "model.layers.11",
68
- "model.layers.12",
69
- "model.layers.13",
70
- "model.layers.14",
71
- "model.layers.15",
72
- "model.layers.16",
73
- "model.layers.17",
74
- "model.layers.18",
75
- "model.layers.19",
76
- "model.layers.20",
77
- "model.layers.21",
78
- "model.layers.22",
79
- "model.layers.23",
80
- "model.layers.24",
81
- "model.layers.25",
82
- "model.layers.26",
83
- "model.layers.27",
84
- "model.layers.28",
85
- "model.layers.29",
86
- "model.layers.30",
87
- "model.layers.31",
88
- "model.layers.32",
89
- "model.layers.33",
90
- "model.layers.34",
91
- "model.layers.35",
92
- "model.layers.36",
93
- "model.layers.37",
94
- "model.layers.38",
95
- "model.layers.39",
96
- "model.layers.40",
97
- "model.layers.41",
98
- "model.layers.42",
99
- "model.layers.43",
100
- "model.layers.44",
101
- "model.layers.45",
102
- "model.layers.46",
103
- "model.layers.47",
104
- "model.layers.48",
105
- "model.layers.49",
106
- "model.layers.50",
107
- "model.layers.51",
108
- "model.layers.52",
109
- "model.layers.53",
110
- "model.layers.54",
111
- "model.layers.55",
112
- "model.layers.56",
113
- "model.layers.57",
114
- "model.layers.58",
115
- "model.layers.59",
116
- "model.layers.60",
117
- "model.layers.61",
118
- "model.layers.62",
119
- "model.layers.63"
120
- ]
121
- ]
122
  },
123
  "rms_norm_eps": 1e-05,
124
  "rope_scaling": null,
 
51
  "scale_dtype": "torch.float16",
52
  "seqlen": 2048,
53
  "sym": true,
54
+ "block_name_to_quantize": "model.layers"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  },
56
  "rms_norm_eps": 1e-05,
57
  "rope_scaling": null,