diff --git a/tensorrt_llm/_torch/models/modeling_qwen3vl.py b/tensorrt_llm/_torch/models/modeling_qwen3vl.py
index 4bdcfc7678..e9f77153d9 100644
--- a/tensorrt_llm/_torch/models/modeling_qwen3vl.py
+++ b/tensorrt_llm/_torch/models/modeling_qwen3vl.py
@@ -739,9 +739,11 @@ class Qwen3VisionModel(torch.nn.Module):
 
         # Getting positional embedding
         rotary_pos_emb = self.rot_pos_emb(grid_thw)
+        pos_embeds = self.fast_pos_embed_interpolate(grid_thw)
 
         # From this point, pure GPU operation
         hidden_states = self.patch_embed(pixel_values)
+        hidden_states = hidden_states + pos_embeds
         seq_len, _ = hidden_states.size()
         hidden_states = hidden_states.reshape(seq_len, -1)