We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 78046c4 commit 65a8889 Copy full SHA for 65a8889
1 file changed
tests/gpu/torch/export/test_export.py
@@ -488,7 +488,8 @@ def test_qwen3_moe_nvfp4_experts_only_export_exclude_modules(tmp_path):
488
model.config.architectures = ["Qwen3MoeForCausalLM"]
489
490
# Quantize with NVFP4_EXPERTS_ONLY_CFG (targets only *mlp.experts* patterns)
491
- mtq.quantize(model, NVFP4_EXPERTS_ONLY_CFG, lambda m: m(**m.dummy_inputs))
+ dummy_inputs = {k: v.to("cuda") for k, v in model.dummy_inputs.items()}
492
+ mtq.quantize(model, NVFP4_EXPERTS_ONLY_CFG, lambda m: m(**dummy_inputs))
493
494
# Export
495
export_dir = tmp_path / "qwen3_moe_nvfp4_experts_only"
0 commit comments