mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-18 00:35:04 +08:00
[https://nvbugs/5644187][fix] Llava-Next MMMU bugfix and Phi4 test bugfix (#9034)
Signed-off-by: yechank <161688079+yechank-nvidia@users.noreply.github.com>
This commit is contained in:
parent
f40e1f7496
commit
0938a3ad2a
@ -4,7 +4,7 @@ Qwen/Qwen2.5-VL-7B-Instruct:
|
||||
- accuracy: 51.22
|
||||
nvidia/Nano-v2-VLM:
|
||||
- accuracy: 43.78
|
||||
llava-hf/llava-v1.6-mistral-7b:
|
||||
llava-hf/llava-v1.6-mistral-7b-hf:
|
||||
- accuracy: 35.33
|
||||
Efficient-Large-Model/NVILA-8B:
|
||||
- accuracy: 47.77
|
||||
|
||||
@ -80,8 +80,8 @@ class TestNano_V2_VLM(LlmapiAccuracyTestHarness):
|
||||
|
||||
|
||||
class TestLlava_V1_6_Mistral_7B(LlmapiAccuracyTestHarness):
|
||||
MODEL_NAME = "llava-hf/llava-v1.6-mistral-7b"
|
||||
MODEL_PATH = f"{llm_models_root()}/llava-v1.6-mistral-7b"
|
||||
MODEL_NAME = "llava-hf/llava-v1.6-mistral-7b-hf"
|
||||
MODEL_PATH = f"{llm_models_root()}/llava-v1.6-mistral-7b-hf"
|
||||
MAX_NUM_TOKENS = 16384
|
||||
|
||||
# NOTE: MMMU adds <|endoftext|> to the stop token.
|
||||
|
||||
@ -2658,7 +2658,7 @@ def test_ptp_quickstart_multimodal_kv_cache_reuse(llm_root, llm_venv,
|
||||
],
|
||||
] * num_same_requests,
|
||||
},
|
||||
"phi4-multimodal-instruct-fp8": {
|
||||
"phi4-multimodal-instruct": {
|
||||
"image": [
|
||||
[
|
||||
"image", "depicts", "natural", "environment", "ocean",
|
||||
|
||||
Loading…
Reference in New Issue
Block a user