mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
[AutoDeploy] fix: disable overlap scheduler until supported (#4365)
Signed-off-by: Lucas Liebenwein <11156568+lucaslie@users.noreply.github.com>
This commit is contained in:
parent
c6e2111f4e
commit
4883121477
@ -120,3 +120,6 @@ class AutoDeployConfig(PyTorchConfig):
|
||||
# gets replaced by the user-provided one. We don't want that though.
|
||||
f_default = self.__dataclass_fields__["model_kwargs"].default_factory()
|
||||
setattr(self, "model_kwargs", {**f_default, **getattr(self, "model_kwargs")})
|
||||
|
||||
# TODO (https://github.com/NVIDIA/TensorRT-LLM/issues/4364) support overlap scheduler
|
||||
self.disable_overlap_scheduler = True
|
||||
|
||||
Loading…
Reference in New Issue
Block a user