TensorRT-LLMs/tensorrt_llm/_torch/cublaslt_utils.py
2025-10-23 15:55:10 +08:00

19 lines
604 B
Python

# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
from ..logger import logger
# Module-level flag: True only when the cuBLASLt FP4 GEMM runner custom class
# can be resolved through torch.classes. Stays False when torch is missing or
# when the class has not been registered.
IS_CUBLASLT_AVAILABLE = False

# Check cuBLASLt availability
try:
    import torch
except ImportError:
    # torch is not installed, so the runner cannot be available; keep False.
    pass
else:
    # CublasLtFP4GemmRunner is the class used by nvfp4_gemm_cublaslt.
    #
    # The lookup is done with a direct attribute access instead of hasattr():
    # torch.classes namespaces report an unregistered custom class with
    # RuntimeError rather than AttributeError, and hasattr() only swallows
    # AttributeError, so a hasattr() probe would propagate the error and break
    # importing this module on builds without the class.
    try:
        _cublaslt_fp4_runner_cls = torch.classes.trtllm.CublasLtFP4GemmRunner
    except (AttributeError, RuntimeError):
        _cublaslt_fp4_runner_cls = None

    if _cublaslt_fp4_runner_cls is not None:
        logger.info("cuBLASLt FP4 GEMM is available")
        IS_CUBLASLT_AVAILABLE = True