From ef05ec0aab42aec7566dac0f1b1e12be466a33fe Mon Sep 17 00:00:00 2001 From: "He, Xin3" Date: Wed, 21 Jan 2026 17:13:44 +0800 Subject: [PATCH 1/2] align act_max of experts for qwen3-vl and qwen3-next Signed-off-by: He, Xin3 --- auto_round/utils/model.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/auto_round/utils/model.py b/auto_round/utils/model.py index f4c6e7b75..25208e6a1 100644 --- a/auto_round/utils/model.py +++ b/auto_round/utils/model.py @@ -613,6 +613,8 @@ def is_moe_layer(module: torch.nn.Module) -> bool: "DeepseekV3MoE".lower(), "Qwen2MoeSparseMoeBlock".lower(), "Qwen3MoeSparseMoeBlock".lower(), + "Qwen3NextSparseMoeBlock".lower(), + "Qwen3VLMoeTextSparseMoeBlock".lower(), ] ) @@ -722,7 +724,7 @@ def module_match_name_list(module, name_list): return any(name.lower() in type(module).__name__.lower() for name in name_list) if module_match_name_list( - module, ["Qwen2MoeSparseMoeBlock", "Qwen3MoeSparseMoeBlock", "DeepseekMoE", "DeepseekV2MoE", "DeepseekV3MoE"] + module, ["Qwen2MoeSparseMoeBlock", "Qwen3MoeSparseMoeBlock", "Qwen3NextSparseMoeBlock", "Qwen3VLMoeTextSparseMoeBlock", "DeepseekMoE", "DeepseekV2MoE", "DeepseekV3MoE"] ): return ["gate_proj", "down_proj", "up_proj"] elif module_match_name_list(module, ["MixtralMoeSparseMoeBlock"]): From 6f5ed28925edfefb8a3888e0d6d3e2ba91ac1071 Mon Sep 17 00:00:00 2001 From: "pre-commit-ci[bot]" <66853113+pre-commit-ci[bot]@users.noreply.github.com> Date: Wed, 21 Jan 2026 09:15:51 +0000 Subject: [PATCH 2/2] [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci --- auto_round/utils/model.py | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/auto_round/utils/model.py b/auto_round/utils/model.py index 25208e6a1..da34dd9b7 100644 --- a/auto_round/utils/model.py +++ b/auto_round/utils/model.py @@ -724,7 +724,16 @@ def module_match_name_list(module, name_list): return any(name.lower() in type(module).__name__.lower() for name in name_list) if module_match_name_list( - module, ["Qwen2MoeSparseMoeBlock", "Qwen3MoeSparseMoeBlock", "Qwen3NextSparseMoeBlock", "Qwen3VLMoeTextSparseMoeBlock", "DeepseekMoE", "DeepseekV2MoE", "DeepseekV3MoE"] + module, + [ + "Qwen2MoeSparseMoeBlock", + "Qwen3MoeSparseMoeBlock", + "Qwen3NextSparseMoeBlock", + "Qwen3VLMoeTextSparseMoeBlock", + "DeepseekMoE", + "DeepseekV2MoE", + "DeepseekV3MoE", + ], ): return ["gate_proj", "down_proj", "up_proj"] elif module_match_name_list(module, ["MixtralMoeSparseMoeBlock"]):