mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-05 18:51:38 +08:00
[https://nvbugs/5836592][fix] Fix qwen3 eagle test (#11030)
Signed-off-by: Mike Iovine <miovine@nvidia.com>
This commit is contained in:
parent
a4880ffdbb
commit
0ad87895f5
@ -3720,8 +3720,8 @@ class TestQwen3_4B(LlmapiAccuracyTestHarness):
|
||||
target_model_dir = f"{llm_models_root()}/Qwen3/Qwen3-4B"
|
||||
|
||||
draft_len = 3
|
||||
spec_config = EagleDecodingConfig(max_draft_len=draft_len,
|
||||
speculative_model_dir=eagle_model_dir)
|
||||
spec_config = Eagle3DecodingConfig(
|
||||
max_draft_len=draft_len, speculative_model_dir=eagle_model_dir)
|
||||
|
||||
with LLM(model=target_model_dir,
|
||||
**pytorch_config,
|
||||
|
||||
Loading…
Reference in New Issue
Block a user