/* * SPDX-FileCopyrightText: Copyright (c) 2023 NVIDIA CORPORATION & AFFILIATES. All rights reserved. * SPDX-License-Identifier: LicenseRef-NvidiaProprietary * * NVIDIA CORPORATION, its affiliates and licensors retain all intellectual * property and proprietary rights in and to this material, related * documentation and any modifications thereto. Any use, reproduction, * disclosure or distribution of this material and related documentation * without an express license agreement from NVIDIA CORPORATION or * its affiliates is strictly prohibited. */ #pragma once #include "tensorrt_llm/runtime/common.h" #include "tensorrt_llm/runtime/iTensor.h" #include "tensorrt_llm/runtime/modelConfig.h" #include "tensorrt_llm/runtime/worldConfig.h" namespace tensorrt_llm::runtime::lora { SizeType32 constexpr kLORA_CONFIG_ROW_SIZE = 3; SizeType32 constexpr kLORA_CONFIG_MODULE_OFF = 0; SizeType32 constexpr kLORA_CONFIG_LAYER_OFF = 1; SizeType32 constexpr kLORA_CONFIG_ADAPTER_SIZE_OFF = 2; SizeType32 constexpr kLORA_NUM_WEIGHTS_POINTERS = 2; void loraValidateRequestTensorDims(std::optional const& optReqLoraWeights, std::optional const& optReqLoraConfig); void loraValidateRequestTensors(std::optional const& optTaskId, std::optional const& optReqLoraWeights, std::optional const& optReqLoraConfig, runtime::ModelConfig const& modelConfig, runtime::WorldConfig const& worldConfig); } // namespace tensorrt_llm::runtime::lora