mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
feat : reduce trt engine build time in testing (#3014)
Signed-off-by: peaceh <103117813+peaceh-nv@users.noreply.github.com>
This commit is contained in:
parent
1ac0566a93
commit
5e272eef81
@ -754,7 +754,9 @@ class TestFunctional(unittest.TestCase):
|
||||
precision=dtype,
|
||||
int8=int8_trt_flag,
|
||||
quant_mode=quant_mode)
|
||||
|
||||
# Reduce the TRT engine build time by setting the max allowed number of tactics in builder tactic profiling.
|
||||
if builder_config.trt_builder_config.max_num_tactics == -1:
|
||||
builder_config.trt_builder_config.max_num_tactics = 30
|
||||
if session is None:
|
||||
engine = builder.build_engine(net, builder_config)
|
||||
session = tensorrt_llm.runtime.Session.from_serialized_engine(
|
||||
|
||||
Loading…
Reference in New Issue
Block a user