Upload Qwen2AudioForConditionalGeneration

Files changed (5)

config.json (changed)

@@ -5,7 +5,7 @@
   ],
   "audio_config": {
     "model_type": "qwen2_audio_encoder",
-    "torch_dtype": "float32"
   },
   "audio_token_index": 151646,
   "ignore_index": -100,
@@ -44,7 +44,7 @@
       }
     },
     "format": "int-quantized",
-    "global_compression_ratio": 2.02943919718519,
     "ignore": [],
     "kv_cache_scheme": null,
     "quant_method": "compressed-tensors",
@@ -58,11 +58,11 @@
     "model_type": "qwen2",
     "rms_norm_eps": 1e-05,
     "sliding_window": null,
-    "torch_dtype": "float32",
     "use_mrope": false,
     "vocab_size": 156032
   },
-  "torch_dtype": "float32",
   "transformers_version": "4.49.0",
   "vocab_size": 156032
 }

   ],
   "audio_config": {
     "model_type": "qwen2_audio_encoder",
+    "torch_dtype": "bfloat16"
   },
   "audio_token_index": 151646,
   "ignore_index": -100,
       }
     },
     "format": "int-quantized",
+    "global_compression_ratio": 1.510915647565434,
     "ignore": [],
     "kv_cache_scheme": null,
     "quant_method": "compressed-tensors",
     "model_type": "qwen2",
     "rms_norm_eps": 1e-05,
     "sliding_window": null,
+    "torch_dtype": "bfloat16",
     "use_mrope": false,
     "vocab_size": 156032
   },
+  "torch_dtype": "bfloat16",
   "transformers_version": "4.49.0",
   "vocab_size": 156032
 }

model-00001-of-00002.safetensors (changed)

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:de8191ef44c9e32fe0b6d7b88688998843fcce1f69217513069ee4c91e92abb1
 size 4983429624

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9bd6c0780a60409335aa5db67a96b858e0c5cd0c5fcf9684a44d684cde40fb7
 size 4983429624

model-00002-of-00002.safetensors (changed)

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9863ce817c5ffc2e4b49e71514981bd9e26e01bda1281d323450c2a91902ba3
 size 4065193744

 version https://git-lfs.github.com/spec/v1
+oid sha256:7aaedfb5091b9e1047962df0869c02dfbff66d71841aa617afcfaee761c560f7
 size 4065193744

model.safetensors.index.json (changed)

The diff for this file is too large to render; see the raw diff.

recipe.yaml (changed)

@@ -1,6 +1,6 @@
 DEFAULT_stage:
   DEFAULT_modifiers:
-    SmoothQuantModifier: {smoothing_strength: 0.8}
     GPTQModifier:
       scheme: W8A8
       targets: Linear

 DEFAULT_stage:
   DEFAULT_modifiers:
+    SmoothQuantModifier: {smoothing_strength: 0.5}
     GPTQModifier:
       scheme: W8A8
       targets: Linear