diff --git a/tests/unittest/_torch/auto_deploy/unit/singlegpu/models/test_llama4_vlm_patch.py b/tests/unittest/_torch/auto_deploy/unit/singlegpu/models/test_llama4_vlm_patch.py index 40f118b18d..51ff13fac3 100644 --- a/tests/unittest/_torch/auto_deploy/unit/singlegpu/models/test_llama4_vlm_patch.py +++ b/tests/unittest/_torch/auto_deploy/unit/singlegpu/models/test_llama4_vlm_patch.py @@ -1,3 +1,4 @@ +import pytest import torch from _model_test_utils import get_small_model_config from build_and_run_ad import ExperimentConfig @@ -8,6 +9,7 @@ from tensorrt_llm._torch.auto_deploy.export import apply_export_patches, torch_e from tensorrt_llm._torch.auto_deploy.transformations._graph import move_to_device +@pytest.mark.skip(reason="https://nvbugspro.nvidia.com/bug/5505835") def test_build_run_llama4_vlm(): atol = 1e-3 rtol = 1e-3