mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-18 08:45:05 +08:00
[https://nvbugs/5854419][fix] Fix Qwen3-VL-Dense/MoE accuracy drop (#11134)
Signed-off-by: yechank <161688079+yechank-nvidia@users.noreply.github.com>
Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com>
This commit is contained in:
parent
435ea36977
commit
ebd859cf61
@ -1138,6 +1138,7 @@ class Qwen3VLModelBase(PreTrainedModel):
|
||||
"video": "<|vision_start|><|video_pad|><|vision_end|>",
|
||||
},
|
||||
placeholder_placement=MultimodalPlaceholderPlacement.BEFORE_TEXT,
|
||||
placeholders_separator="",
|
||||
),
|
||||
)
|
||||
class Qwen3VLModel(Qwen3VLModelBase):
|
||||
|
||||
@ -41,6 +41,7 @@ from .modeling_utils import ModelConfig, register_auto_model, register_vision_en
|
||||
"video": "<|vision_start|><|video_pad|><|vision_end|>",
|
||||
},
|
||||
placeholder_placement=MultimodalPlaceholderPlacement.BEFORE_TEXT,
|
||||
placeholders_separator="",
|
||||
),
|
||||
)
|
||||
class Qwen3MoeVLModel(Qwen3VLModelBase):
|
||||
|
||||
Loading…
Reference in New Issue
Block a user