diff --git a/tests/unittest/llmapi/test_llm.py b/tests/unittest/llmapi/test_llm.py index 2c7a7642f0..7369c72fa9 100644 --- a/tests/unittest/llmapi/test_llm.py +++ b/tests/unittest/llmapi/test_llm.py @@ -228,6 +228,7 @@ def test_llm_loading_from_hf(): kv_cache_config=global_kvcache_config) +@pytest.mark.skip(reason="https://nvbugs/5266240") @force_ampere @pytest.mark.part0 def test_llm_loading_from_ckpt(): @@ -246,7 +247,11 @@ def test_llm_loading_from_ckpt(): sampling_params=SamplingParams(max_tokens=8)) -@pytest.mark.parametrize('model_format', ['hf', 'ckpt']) +@pytest.mark.parametrize('model_format', [ + 'hf', + pytest.param('ckpt', + marks=pytest.mark.skip(reason="https://nvbugs/5266240")) +]) @pytest.mark.part0 def test_llm_with_dummy_weights(model_format): # dummy_dir contains config.json and tokenizer files only