[https://nvbugs/5854419][fix] Fix Qwen3-VL-Dense/MoE accuracy drop (#11134)

Signed-off-by: yechank <161688079+yechank-nvidia@users.noreply.github.com>
Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com>
2026-02-18 08:45:05 +08:00 · 2026-02-03 18:59:44 +09:00 · 2026-02-03 18:59:44 +09:00 · ebd859cf61
commit ebd859cf61
parent 435ea36977
2 changed files with 2 additions and 0 deletions
--- a/tensorrt_llm/_torch/models/modeling_qwen3vl.py
+++ b/tensorrt_llm/_torch/models/modeling_qwen3vl.py
@@ -1138,6 +1138,7 @@ class Qwen3VLModelBase(PreTrainedModel):
            "video": "<|vision_start|><|video_pad|><|vision_end|>",
        },
        placeholder_placement=MultimodalPlaceholderPlacement.BEFORE_TEXT,
+        placeholders_separator="",
    ),
 )
 class Qwen3VLModel(Qwen3VLModelBase):
--- a/tensorrt_llm/_torch/models/modeling_qwen3vl_moe.py
+++ b/tensorrt_llm/_torch/models/modeling_qwen3vl_moe.py
@@ -41,6 +41,7 @@ from .modeling_utils import ModelConfig, register_auto_model, register_vision_en
            "video": "<|vision_start|><|video_pad|><|vision_end|>",
        },
        placeholder_placement=MultimodalPlaceholderPlacement.BEFORE_TEXT,
+        placeholders_separator="",
    ),
 )
 class Qwen3MoeVLModel(Qwen3VLModelBase):