Fix qwen3_moe SwitchGLU to use moe_intermediate_size; add Qwen3-Coder-30B-A3B catalog entries

GandalfTea · GandalfTea · commit a2e676bdea86 · 2025-11-27T00:13:08.000-08:00
diff --git a/src/dnet/api/catalog.py b/src/dnet/api/catalog.py
@@ -204,5 +204,17 @@
             "quantization": "4bit",
             "alias": "qwen3-moe-30b",
         },
+        {
+            "id": "mlx-community/Qwen3-Coder-30B-A3B-Instruct-4bit",
+            "arch": "qwen3_moe",
+            "quantization": "4bit",
+            "alias": "qwen3-moe-30b",
+        },
+        {
+            "id": "mlx-community/Qwen3-Coder-30B-A3B-Instruct-8bit",
+            "arch": "qwen3_moe",
+            "quantization": "8bit",
+            "alias": "qwen3-moe-30b",
+        },
     ]
 }
diff --git a/src/dnet/core/models/qwen3_moe.py b/src/dnet/core/models/qwen3_moe.py
@@ -14,7 +14,7 @@ def __init__(self, args: ModelArgs):
         self.num_experts = args.num_experts
         self.gate = nn.Linear(args.hidden_size, self.num_experts, bias=False)
         self.switch_mlp = SwitchGLU(
-            args.hidden_size, args.intermediate_size, self.num_experts
+            args.hidden_size, args.moe_intermediate_size, self.num_experts
         )
 
     def __call__(self, x: mx.array):

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
|  |  | `@@ -14,7 +14,7 @@ def __init__(self, args: ModelArgs):` |
| 14 | 14 | `self.num_experts = args.num_experts` |
| 15 | 15 | `self.gate = nn.Linear(args.hidden_size, self.num_experts, bias=False)` |
| 16 | 16 | `self.switch_mlp = SwitchGLU(` |
| 17 |  | `- args.hidden_size, args.intermediate_size, self.num_experts` |
|  | 17 | `+ args.hidden_size, args.moe_intermediate_size, self.num_experts` |
| 18 | 18 | `)` |
| 19 | 19 |  |
| 20 | 20 | `def __call__(self, x: mx.array):` |