Fix Qwen3MoE config parsing (#3336) · InternLM/lmdeploy@42167c8 · GitHub
[go: up one dir, main page]

Skip to content

Commit 42167c8

Browse files
authored
Fix Qwen3MoE config parsing (#3336)
* fix qwen3moe
* fuck
1 parent 6fe9371 commit 42167c8

File tree

1 file changed

+14
-5
lines changed
  • lmdeploy/turbomind/deploy/source_model

1 file changed

+14
-5
lines changed

lmdeploy/turbomind/deploy/source_model/qwen.py

Lines changed: 14 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -149,9 +149,9 @@ def model_info(self):
149149
info['expert_inter_size'] = cfg['moe_intermediate_size']
150150
info['experts_per_token'] = cfg['num_experts_per_tok']
151151
info['inter_size'] = cfg['shared_expert_intermediate_size']
152-
info['moe_shared_gate'] = info['inter_size'] > 0
152+
info['moe_shared_gate'] = True
153153
info['norm_topk_prob'] = cfg['norm_topk_prob']
154-
info['attn_bias'] = cfg.get('attention_bias', 1)
154+
info['attn_bias'] = cfg.get('qkv_bias', 1)
155155
return info
156156

157157

@@ -170,8 +170,9 @@ class Qwen3Model(LlamaModel):
170170
Reader = Qwen3Reader
171171

172172
def model_info(self):
173+
cfg = self.model_config
173174
info = super().model_info()
174-
info['qk_norm'] = True
175+
info.update(qk_norm=True, attn_bias=cfg.get('attention_bias', 0))
175176
return info
176177

177178

@@ -186,10 +187,18 @@ def qk_norm(self, i: int):
186187

187188

188189
@INPUT_MODELS.register_module(name='qwen3-moe')
189-
class Qwen3MoeModel(Qwen2MoeModel):
190+
class Qwen3MoeModel(LlamaModel):
190191
Reader = Qwen3MoeReader
191192

192193
def model_info(self):
194+
cfg = self.model_config
193195
info = super().model_info()
194-
info['qk_norm'] = True
196+
info.update(
197+
qk_norm=True,
198+
expert_num=cfg.get('num_experts', 128),
199+
experts_per_token=cfg.get('num_experts_per_tok', 8),
200+
expert_inter_size=cfg.get('moe_intermediate_size', 768),
201+
attn_bias=cfg.get('attention_bias', 0),
202+
inter_size=0, # no shared expert
203+
norm_topk_prob=cfg.get('norm_topk_prob', False))
195204
return info

0 commit comments

Comments
 (0)
0