[https://nvbugs/5433545][fix] TestPhi4MiniInstruct::test_auto_dtype - Use max_seq_len=4096 to fall back to the short RoPE factor (#6895)

Signed-off-by: Michal Guzek <mguzek@nvidia.com>
This commit is contained in:
Michal Guzek 2025-08-22 10:28:09 -07:00 committed by GitHub
parent 4b6cca0662
commit 7ea53ff516
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -2334,7 +2334,7 @@ class TestPhi4MiniInstruct(LlmapiAccuracyTestHarness):
MODEL_PATH = f"{llm_models_root()}/Phi-4-mini-instruct"
def test_auto_dtype(self):
-with LLM(self.MODEL_PATH) as llm:
+with LLM(self.MODEL_PATH, max_seq_len=4096) as llm:
task = CnnDailymail(self.MODEL_NAME)
task.evaluate(llm)
task = MMLU(self.MODEL_NAME)