[AutoDeploy] fix: disable overlap scheduler until supported (#4365)

Signed-off-by: Lucas Liebenwein <11156568+lucaslie@users.noreply.github.com>
2026-01-14 06:27:45 +08:00 · 2025-05-15 19:19:30 -04:00 · 2025-05-15 19:19:30 -04:00 · 4883121477
commit 4883121477
parent c6e2111f4e
1 changed files with 3 additions and 0 deletions
--- a/tensorrt_llm/_torch/auto_deploy/shim/interface.py
+++ b/tensorrt_llm/_torch/auto_deploy/shim/interface.py
@@ -120,3 +120,6 @@ class AutoDeployConfig(PyTorchConfig):
        # gets replaced by the user provided one. We don't want that though.
        f_default = self.__dataclass_fields__["model_kwargs"].default_factory()
        setattr(self, "model_kwargs", {**f_default, **getattr(self, "model_kwargs")})
+
+        # TODO (https://github.com/NVIDIA/TensorRT-LLM/issues/4364) support overlap scheduler
+        self.disable_overlap_scheduler = True