mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-05 02:31:33 +08:00
[None][chore] Reduce tedious logs (#10819)
Signed-off-by: Yanchao Lu <yanchaol@nvidia.com>
Signed-off-by: Wangshanshan <30051912+dominicshanshan@users.noreply.github.com>
This commit is contained in:
parent
44aa6c3b8e
commit
18f63dfcec
@@ -331,11 +331,11 @@ class Attention(nn.Module):
|
||||
key="sparse_attention_config")
|
||||
|
||||
if config.sparse_attention_config.algorithm == "rocket":
|
||||
- logger.warning("disable rope_fusion for RocketKV.")
+ logger.info_once("disable rope_fusion for RocketKV.")
|
||||
self.rope_fusion = False
|
||||
|
||||
if self.rope_fusion and not attn_cls.support_fused_rope():
|
||||
- logger.warning(
+ logger.info_once(
|
||||
"rope_fusion is true but the attention backend does not support it. Will disable rope_fusion."
|
||||
)
|
||||
self.rope_fusion = False
|
||||
|
||||
Loading…
Reference in New Issue
Block a user