beyoru
/

Qwen3-MaCoTo

Text Generation

Model card Files Files and versions

beyoru committed on Sep 7

Commit

ad207aa

·

verified ·

1 Parent(s): eff3035

Create qwen3_moe_config.py

Files changed (1) hide show

qwen3_moe_config.py +20 -0

qwen3_moe_config.py ADDED Viewed

	@@ -0,0 +1,20 @@

+from transformers import PretrainedConfig
+class Qwen3MoEConfig(PretrainedConfig):
+    """Configuration object registered under the model type ``"qwen3moe"``.
+
+    Stores the constructor arguments as attributes on the config. Any extra
+    keyword arguments are forwarded to ``PretrainedConfig.__init__``.
+
+    Args:
+        router_model_path: Stored as-is; defaults to ``None``. Presumably the
+            location of the router model -- confirm against the model code.
+        expert_model_paths: Stored on the config; any falsy value (including
+            ``None``) is replaced by a new empty dict. Presumably a mapping
+            that identifies each expert's model path -- TODO confirm key/value
+            schema with the code that consumes this config.
+        labels: Stored on the config; any falsy value (including ``None``) is
+            replaced by a new empty list.
+        torch_dtype: Stored as-is; defaults to the string ``"auto"``.
+        tokenizer_path: Stored as-is; defaults to ``None``.
+        **kwargs: Passed through unchanged to ``PretrainedConfig.__init__``.
+    """
+    model_type = "qwen3moe"
+    def __init__(
+        self,
+        router_model_path=None,
+        expert_model_paths=None,
+        labels=None,
+        torch_dtype="auto",
+        tokenizer_path=None,
+        **kwargs,
+    ):
+        # Let the base class consume every keyword not named explicitly above.
+        super().__init__(**kwargs)
+        self.router_model_path = router_model_path
+        # `or` gives each instance its own fresh container when the caller
+        # passes nothing (or any falsy value), avoiding a shared mutable default.
+        self.expert_model_paths = expert_model_paths or {}
+        self.labels = labels or []
+        # NOTE(review): torch_dtype is a named parameter here, so it is not in
+        # the kwargs given to the base initializer; it is assigned directly
+        # after that call. Confirm this is the intended handling.
+        self.torch_dtype = torch_dtype
+        self.tokenizer_path = tokenizer_path