[None][fix] Add missing absolute pe in Qwen3-VL Vision Encoder (#11065)

Signed-off-by: Necofish <liuxiangyang@mail.ustc.edu.cn>
2026-02-04 18:21:52 +08:00 · 2026-01-30 08:59:36 +08:00 · 2026-01-30 08:59:36 +08:00 · 144b61715f
commit 144b61715f
parent 54ba056924
1 changed file with 2 additions and 0 deletions
--- a/tensorrt_llm/_torch/models/modeling_qwen3vl.py
+++ b/tensorrt_llm/_torch/models/modeling_qwen3vl.py
@@ -739,9 +739,11 @@ class Qwen3VisionModel(torch.nn.Module):

        # Getting positional embedding
        rotary_pos_emb = self.rot_pos_emb(grid_thw)
+        pos_embeds = self.fast_pos_embed_interpolate(grid_thw)

        # From this point, pure GPU operation
        hidden_states = self.patch_embed(pixel_values)
+        hidden_states = hidden_states + pos_embeds
        seq_len, _ = hidden_states.size()
        hidden_states = hidden_states.reshape(seq_len, -1)