TensorRT-LLMs/cpp/include/tensorrt_llm/deep_gemm/utils.cuh
Gabriel Wu 376731013d
feat: use NVRTC for DeepGEMM JIT compilation (#3239)
* feat: use NVRTC for DeepGEMM JIT compilation

Signed-off-by: Zihua Wu 

* fix: add license

Signed-off-by: Zihua Wu

* feat: store NVRTC JIT results in memory by default

Signed-off-by: Zihua Wu


* feat: refinement

Signed-off-by: Zihua Wu

* feat: refinement

Signed-off-by: Zihua Wu

* test: set timeout to 7200

Signed-off-by: Zihua Wu

---------

Signed-off-by: Zihua Wu
2025-04-07 20:29:23 +08:00

87 lines
3.5 KiB
Plaintext

/*
* SPDX-FileCopyrightText: Copyright (c) 2025 DeepSeek
* SPDX-License-Identifier: MIT
*
* Licensed under the MIT License.
* You may obtain a copy of the License at
*
* https://opensource.org/licenses/MIT
*
*
* SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
* SPDX-License-Identifier: Apache-2.0
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#pragma once
#ifndef NVRTC_JIT_COMPILATION
#include <cstdio>
#include <exception>
#include <string>
// Exception type thrown when a host-side assertion (DG_HOST_ASSERT) fails.
//
// Stores its own copy of the diagnostic text handed to the constructor and
// exposes it through the standard std::exception::what() interface.
class AssertionException : public std::exception
{
private:
    // Owned copy of the diagnostic text; what() returns a pointer into this buffer.
    // Named differently from the constructor parameter so the two cannot be confused.
    std::string mMessage{};

public:
    // message: human-readable description of the failed assertion (copied).
    explicit AssertionException(std::string const& message)
        : mMessage(message)
    {
    }

    // Returns the stored text as a null-terminated string. The pointer refers to
    // storage owned by this exception object.
    char const* what() const noexcept override
    {
        return mMessage.c_str();
    }
};
#endif
// DG_HOST_ASSERT(cond): host-side runtime check.
//   * With NVRTC_JIT_COMPILATION defined, the macro expands to a no-op and
//     `cond` is never evaluated.
//   * Otherwise, when `cond` is false, the file name, line number and the
//     condition text are printed with printf, and an AssertionException
//     carrying the stringified condition is thrown.
// A definition of DG_HOST_ASSERT made before this point is left in place.
#if !defined(DG_HOST_ASSERT)
#if defined(NVRTC_JIT_COMPILATION)
#define DG_HOST_ASSERT(cond) ((void) 0)
#else
#define DG_HOST_ASSERT(cond) \
    do \
    { \
        if (!(cond)) \
        { \
            printf("Assertion failed: %s:%d, condition: %s\n", __FILE__, __LINE__, #cond); \
            throw AssertionException("Assertion failed: " #cond); \
        } \
    } while (0)
#endif // NVRTC_JIT_COMPILATION
#endif // DG_HOST_ASSERT
// DG_DEVICE_ASSERT(cond): runtime check for device code.
// When `cond` is false, the file name, line number and the condition text are
// printed with printf and the PTX `trap` instruction is executed.
//
// The asm statement is marked `volatile` because it has no output operands:
// without the qualifier the compiler is allowed to assume the statement has no
// side effects and may delete or move it, which would silently disable the trap.
//
// A definition of DG_DEVICE_ASSERT made before this point is left in place.
#ifndef DG_DEVICE_ASSERT
#define DG_DEVICE_ASSERT(cond) \
    do \
    { \
        if (!(cond)) \
        { \
            printf("Assertion failed: %s:%d, condition: %s\n", __FILE__, __LINE__, #cond); \
            asm volatile("trap;"); \
        } \
    } while (0)
#endif
// DG_STATIC_ASSERT(cond, reason): compile-time check that forwards to static_assert.
//
// The macro is variadic so that a condition containing top-level commas
// (for example a template argument list such as std::is_same<A, B>::value)
// is reassembled intact instead of being split into extra macro arguments.
// Existing two-argument uses expand exactly as before.
//
// A definition of DG_STATIC_ASSERT made before this point is left in place.
#ifndef DG_STATIC_ASSERT
#define DG_STATIC_ASSERT(cond, ...) static_assert(cond, __VA_ARGS__)
#endif
// Integer ceiling division: returns the smallest integer q with q * b >= a.
//
// T must be an integral type (the implementation uses operator%).
// Precondition: b > 0.
//
// The result is built from the truncated quotient plus a correction based on
// the remainder rather than from (a + b - 1) / b, because the intermediate
// sum a + b - 1 can exceed the range of T (wrapping for unsigned types,
// undefined behaviour for signed ones). With b > 0 the remainder has the sign
// of a, so the quotient is rounded up exactly when the remainder is positive;
// this also yields the correct ceiling for negative a.
template <typename T>
__device__ __host__ constexpr T ceil_div(T a, T b)
{
    return a / b + (a % b > 0 ? 1 : 0);
}