Shubhra Pandit committed on
Commit
7c8cecf
·
1 Parent(s): 1fd4e36

Update model files

Browse files
Files changed (4) hide show
  1. config.json +4 -4
  2. model.safetensors +2 -2
  3. recipe.yaml +2 -2
  4. tokenizer.json +1 -6
config.json CHANGED
@@ -30,10 +30,10 @@
30
  "Linear"
31
  ],
32
  "weights": {
33
- "actorder": "group",
34
  "block_structure": null,
35
  "dynamic": false,
36
- "group_size": 128,
37
  "num_bits": 4,
38
  "observer": "mse",
39
  "observer_kwargs": {},
@@ -44,7 +44,7 @@
44
  }
45
  },
46
  "format": "pack-quantized",
47
- "global_compression_ratio": 2.0800281480274516,
48
  "ignore": [
49
  "lm_head"
50
  ],
@@ -53,7 +53,7 @@
53
  "quantization_status": "compressed",
54
  "sparsity_config": {
55
  "format": "dense",
56
- "global_sparsity": 0.13778556247646417,
57
  "ignore": [],
58
  "registry_requires_subclass": false,
59
  "sparsity_structure": "unstructured",
 
30
  "Linear"
31
  ],
32
  "weights": {
33
+ "actorder": null,
34
  "block_structure": null,
35
  "dynamic": false,
36
+ "group_size": 64,
37
  "num_bits": 4,
38
  "observer": "mse",
39
  "observer_kwargs": {},
 
44
  }
45
  },
46
  "format": "pack-quantized",
47
+ "global_compression_ratio": 2.0771812517233883,
48
  "ignore": [
49
  "lm_head"
50
  ],
 
53
  "quantization_status": "compressed",
54
  "sparsity_config": {
55
  "format": "dense",
56
+ "global_sparsity": 0.13633800160480383,
57
  "ignore": [],
58
  "registry_requires_subclass": false,
59
  "sparsity_structure": "unstructured",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c42b5cdd5beb78f6424aeb76d144e000fb2effa6276fce51f387bfad9e4549e
3
- size 1660786656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80eacfccfdee065bac8252fc7e806717b506678e7e35090eb0b3246380e9b4fb
3
+ size 1695488752
recipe.yaml CHANGED
@@ -6,6 +6,6 @@ quant_stage:
6
  ignore: [lm_head]
7
  config_groups:
8
  group_0:
9
- weights: {num_bits: 4, type: int, symmetric: true, strategy: group, group_size: 128,
10
- actorder: group, observer: mse}
11
  targets: [Linear]
 
6
  ignore: [lm_head]
7
  config_groups:
8
  group_0:
9
+ weights: {num_bits: 4, type: int, symmetric: true, strategy: group, group_size: 64,
10
+ observer: mse}
11
  targets: [Linear]
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 8196,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {