Skip to content

Commit 65a8889

Browse files
committed
Fix test
Signed-off-by: Chenjie Luo <chenjiel@nvidia.com>
1 parent 78046c4 commit 65a8889

1 file changed

Lines changed: 2 additions & 1 deletion

File tree

tests/gpu/torch/export/test_export.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -488,7 +488,8 @@ def test_qwen3_moe_nvfp4_experts_only_export_exclude_modules(tmp_path):
488488
model.config.architectures = ["Qwen3MoeForCausalLM"]
489489

490490
# Quantize with NVFP4_EXPERTS_ONLY_CFG (targets only *mlp.experts* patterns)
491-
mtq.quantize(model, NVFP4_EXPERTS_ONLY_CFG, lambda m: m(**m.dummy_inputs))
491+
dummy_inputs = {k: v.to("cuda") for k, v in model.dummy_inputs.items()}
492+
mtq.quantize(model, NVFP4_EXPERTS_ONLY_CFG, lambda m: m(**dummy_inputs))
492493

493494
# Export
494495
export_dir = tmp_path / "qwen3_moe_nvfp4_experts_only"

0 commit comments

Comments (0)