From 2d80db4c3666f61093a10460b601cf6a37859b88 Mon Sep 17 00:00:00 2001 From: Frank <3429989+FrankD412@users.noreply.github.com> Date: Thu, 3 Apr 2025 00:00:29 -0700 Subject: [PATCH] chore: Remove build config from Pytorch kwargs. (#3210) Signed-off-by: Frank Di Natale <3429989+FrankD412@users.noreply.github.com> --- tensorrt_llm/bench/benchmark/throughput.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/tensorrt_llm/bench/benchmark/throughput.py b/tensorrt_llm/bench/benchmark/throughput.py index b7874f04b5..c17b368c25 100755 --- a/tensorrt_llm/bench/benchmark/throughput.py +++ b/tensorrt_llm/bench/benchmark/throughput.py @@ -23,7 +23,6 @@ from tensorrt_llm.bench.dataclasses.general import BenchmarkEnvironment from tensorrt_llm.bench.dataclasses.reporting import ReportUtility from tensorrt_llm.bench.utils.data import (create_dataset_from_stream, initialize_tokenizer) -from tensorrt_llm.builder import BuildConfig from tensorrt_llm.llmapi.llm import LLM from tensorrt_llm.logger import logger from tensorrt_llm.sampling_params import SamplingParams @@ -227,7 +226,7 @@ def throughput_command( bench_env.checkpoint_path) kwargs_max_sql = max_seq_len or metadata.max_sequence_length logger.info(f"Setting PyTorch max sequence length to {kwargs_max_sql}") - kwargs["build_config"] = BuildConfig(max_seq_len=kwargs_max_sql, ) + kwargs["max_seq_len"] = kwargs_max_sql else: assert max_seq_len is None, ( "max_seq_len is not a runtime parameter for C++ backend")