---
# Mixture-of-experts merge configuration: two specialist experts plus one
# shared expert, all taken from the Qwen2.5 7B model family.
# NOTE(review): the key names match the mergekit-moe config schema; confirm
# that mergekit-moe is the tool consuming this file.

# Model named as the base for the merge.
base_model: Qwen/Qwen2.5-7B

# NOTE(review): mergekit's documentation describes "random" gating as not
# using prompts, so the positive_prompts lists below would have no effect in
# this mode. If prompt-driven routing is intended, "hidden" or "cheap_embed"
# would be required instead -- confirm intent before changing this value.
gate_mode: random

# Output data type for the merged weights.
dtype: bfloat16

experts:
  # Code-oriented expert.
  - source_model: Qwen/Qwen2.5-Coder-7B
    positive_prompts:
      - "code"
      - "python"
      - "javascript"
      - "programming"
      - "algorithm"

  # Math-oriented expert.
  - source_model: Qwen/Qwen2.5-Math-7B
    positive_prompts:
      - "math"
      - "calculus"
      - "algebra"
      - "geometry"
      - "trigonometry"
      - "reason"
      - "mathematics"
      - "solve"
      - "count"

shared_experts:
  # General-purpose shared expert; same model as base_model.
  - source_model: Qwen/Qwen2.5-7B
    positive_prompts:
      - "chat"
      - "assistant"
      - "fact"
    # NOTE(review): nested under this expert entry because mergekit documents
    # residual_scale as a per-expert field that down-weights the shared
    # expert's output; the original flattened text does not show its nesting
    # level -- confirm.
    residual_scale: 0.1