mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-02-05 02:31:33 +08:00
[None][chore] Reduce tedious logs (#10847)
Signed-off-by: Yanchao Lu <yanchaol@nvidia.com>
This commit is contained in:
parent
3a894951e7
commit
ae8f74b620
@@ -334,11 +334,11 @@ class Attention(nn.Module):
|
||||
key="sparse_attention_config")
|
||||
|
||||
if config.sparse_attention_config.algorithm == "rocket":
|
||||
- logger.warning("disable rope_fusion for RocketKV.")
|
||||
+ logger.info_once("disable rope_fusion for RocketKV.")
|
||||
self.rope_fusion = False
|
||||
|
||||
if self.rope_fusion and not attn_cls.support_fused_rope():
|
||||
- logger.warning(
|
||||
+ logger.info_once(
|
||||
"rope_fusion is true but the attention backend does not support it. Will disable rope_fusion."
|
||||
)
|
||||
self.rope_fusion = False
|
||||
|
||||
Loading…
Reference in New Issue
Block a user