From 435ea36977dbf4611456e94a9e87837f838824df Mon Sep 17 00:00:00 2001 From: Mike Iovine Date: Mon, 2 Feb 2026 10:35:51 -0500 Subject: [PATCH] [None][chore] Add warning about 2-model MTP deprecation (#11043) Signed-off-by: Mike Iovine Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com> --- tensorrt_llm/llmapi/llm_args.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/tensorrt_llm/llmapi/llm_args.py b/tensorrt_llm/llmapi/llm_args.py index f5c16b9d9c..0b4d4e60f2 100644 --- a/tensorrt_llm/llmapi/llm_args.py +++ b/tensorrt_llm/llmapi/llm_args.py @@ -1183,6 +1183,12 @@ class MTPDecodingConfig(DecodingBaseConfig): self.max_total_draft_tokens = kwargs[ 'num_nextn_predict_layers'] # Current MTP only support linear tree + if not self.mtp_eagle_one_model: + logger.warning( + "2-model style MTP is deprecated. The mtp_eagle_one_model flag will do nothing " + "in release 1.3. After that, the flag will be removed entirely." + ) + @classmethod def from_dict(cls, data: dict): out = cls(**data)