File tree Expand file tree Collapse file tree 2 files changed +13
-1
lines changed
Expand file tree Collapse file tree 2 files changed +13
-1
lines changed Original file line number Diff line number Diff line change 204204 "quantization" : "4bit" ,
205205 "alias" : "qwen3-moe-30b" ,
206206 },
207+ {
208+ "id" : "mlx-community/Qwen3-Coder-30B-A3B-Instruct-4bit" ,
209+ "arch" : "qwen3_moe" ,
210+ "quantization" : "4bit" ,
211+ "alias" : "qwen3-moe-30b" ,
212+ },
213+ {
214+ "id" : "mlx-community/Qwen3-Coder-30B-A3B-Instruct-8bit" ,
215+ "arch" : "qwen3_moe" ,
216+ "quantization" : "8bit" ,
217+ "alias" : "qwen3-moe-30b" ,
218+ },
207219 ]
208220}
Original file line number Diff line number Diff line change @@ -14,7 +14,7 @@ def __init__(self, args: ModelArgs):
1414 self .num_experts = args .num_experts
1515 self .gate = nn .Linear (args .hidden_size , self .num_experts , bias = False )
1616 self .switch_mlp = SwitchGLU (
17- args .hidden_size , args .intermediate_size , self .num_experts
17+ args .hidden_size , args .moe_intermediate_size , self .num_experts
1818 )
1919
2020 def __call__ (self , x : mx .array ):
You can’t perform that action at this time.
0 commit comments