fix ci

Edwardf0t1 · Edwardf0t1 · commit 840debf66497 · 2026-02-11T23:23:13.000-08:00
Signed-off-by: Zhiyu Cheng &lt;zhiyuc@nvidia.com&gt;
diff --git a/modelopt/torch/export/model_utils.py b/modelopt/torch/export/model_utils.py
@@ -148,9 +148,9 @@ def get_language_model_from_vl(model) -> list[nn.Module] | None:
         return [model, model.language_model]
 
     # Pattern 3: For encoder-decoder VL models (e.g., Nemotron-Parse), the decoder is the language model.
-    # Note: This is safe because this function is only called when the model is already detected as a VLM.
-    # Non-VLM encoder-decoder models (T5, Bart) won't reach this code path.
-    if hasattr(model, "decoder"):
+    # Only match if the model is detected as multimodal to avoid matching non-VLM encoder-decoder
+    # models like T5, Bart, Whisper which also have .decoder.
+    if hasattr(model, "decoder") and is_multimodal_model(model):
         return [model, model.decoder]
 
     # Pattern 4: No language_model found