mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
223 lines
3.5 KiB
ReStructuredText
223 lines
3.5 KiB
ReStructuredText
Runtime
|
|
==========
|
|
|
|
.. Here are the files in cpp/include/runtime
|
|
.. We manually add a subsection for each file so that detailed descriptions can be added in the future
|
|
.. It is also possible to generate this file automatically and list all the modules in conf.py
|
|
lookaheadBuffers.h
|
|
__________________
|
|
|
|
.. doxygenfile:: lookaheadBuffers.h
|
|
:project: TensorRT-LLM
|
|
|
|
lookaheadModule.h
|
|
_________________
|
|
|
|
.. doxygenfile:: lookaheadModule.h
|
|
:project: TensorRT-LLM
|
|
|
|
iBuffer.h
|
|
_________
|
|
|
|
.. doxygenfile:: iBuffer.h
|
|
:project: TensorRT-LLM
|
|
|
|
modelConfig.h
|
|
_____________
|
|
|
|
.. doxygenfile:: modelConfig.h
|
|
:project: TensorRT-LLM
|
|
|
|
decodingOutput.h
|
|
________________
|
|
|
|
.. doxygenfile:: decodingOutput.h
|
|
:project: TensorRT-LLM
|
|
|
|
promptTuningParams.h
|
|
____________________
|
|
|
|
.. doxygenfile:: promptTuningParams.h
|
|
:project: TensorRT-LLM
|
|
|
|
bufferManager.h
|
|
_______________
|
|
|
|
.. doxygenfile:: bufferManager.h
|
|
:project: TensorRT-LLM
|
|
|
|
gptJsonConfig.h
|
|
_______________
|
|
|
|
.. doxygenfile:: gptJsonConfig.h
|
|
:project: TensorRT-LLM
|
|
|
|
runtimeDefaults.h
|
|
_________________
|
|
|
|
.. doxygenfile:: runtimeDefaults.h
|
|
:project: TensorRT-LLM
|
|
|
|
loraCache.h
|
|
___________
|
|
|
|
.. doxygenfile:: loraCache.h
|
|
:project: TensorRT-LLM
|
|
|
|
rawEngine.h
|
|
___________
|
|
|
|
.. doxygenfile:: rawEngine.h
|
|
:project: TensorRT-LLM
|
|
|
|
gptDecoder.h
|
|
____________
|
|
|
|
.. doxygenfile:: gptDecoder.h
|
|
:project: TensorRT-LLM
|
|
|
|
eagleBuffers.h
|
|
______________
|
|
|
|
.. doxygenfile:: eagleBuffers.h
|
|
:project: TensorRT-LLM
|
|
|
|
medusaModule.h
|
|
______________
|
|
|
|
.. doxygenfile:: medusaModule.h
|
|
:project: TensorRT-LLM
|
|
|
|
virtualMemory.h
|
|
_______________
|
|
|
|
.. doxygenfile:: virtualMemory.h
|
|
:project: TensorRT-LLM
|
|
|
|
explicitDraftTokensBuffers.h
|
|
____________________________
|
|
|
|
.. doxygenfile:: explicitDraftTokensBuffers.h
|
|
:project: TensorRT-LLM
|
|
|
|
iTensor.h
|
|
_________
|
|
|
|
.. doxygenfile:: iTensor.h
|
|
:project: TensorRT-LLM
|
|
|
|
common.h
|
|
________
|
|
|
|
.. doxygenfile:: common.h
|
|
:project: TensorRT-LLM
|
|
|
|
loraCachePageManagerConfig.h
|
|
____________________________
|
|
|
|
.. doxygenfile:: loraCachePageManagerConfig.h
|
|
:project: TensorRT-LLM
|
|
|
|
worldConfig.h
|
|
_____________
|
|
|
|
.. doxygenfile:: worldConfig.h
|
|
:project: TensorRT-LLM
|
|
|
|
loraModule.h
|
|
____________
|
|
|
|
.. doxygenfile:: loraModule.h
|
|
:project: TensorRT-LLM
|
|
|
|
speculativeDecodingMode.h
|
|
_________________________
|
|
|
|
.. doxygenfile:: speculativeDecodingMode.h
|
|
:project: TensorRT-LLM
|
|
|
|
cudaEvent.h
|
|
___________
|
|
|
|
.. doxygenfile:: cudaEvent.h
|
|
:project: TensorRT-LLM
|
|
|
|
decodingInput.h
|
|
_______________
|
|
|
|
.. doxygenfile:: decodingInput.h
|
|
:project: TensorRT-LLM
|
|
|
|
speculativeDecodingModule.h
|
|
___________________________
|
|
|
|
.. doxygenfile:: speculativeDecodingModule.h
|
|
:project: TensorRT-LLM
|
|
|
|
iGptDecoderBatched.h
|
|
____________________
|
|
|
|
.. doxygenfile:: iGptDecoderBatched.h
|
|
:project: TensorRT-LLM
|
|
|
|
eagleModule.h
|
|
_____________
|
|
|
|
.. doxygenfile:: eagleModule.h
|
|
:project: TensorRT-LLM
|
|
|
|
tllmLogger.h
|
|
____________
|
|
|
|
.. doxygenfile:: tllmLogger.h
|
|
:project: TensorRT-LLM
|
|
|
|
gptDecoderBatched.h
|
|
___________________
|
|
|
|
.. doxygenfile:: gptDecoderBatched.h
|
|
:project: TensorRT-LLM
|
|
|
|
cudaStream.h
|
|
____________
|
|
|
|
.. doxygenfile:: cudaStream.h
|
|
:project: TensorRT-LLM
|
|
|
|
ipcNvlsMemory.h
|
|
_______________
|
|
|
|
.. doxygenfile:: ipcNvlsMemory.h
|
|
:project: TensorRT-LLM
|
|
|
|
samplingConfig.h
|
|
________________
|
|
|
|
.. doxygenfile:: samplingConfig.h
|
|
:project: TensorRT-LLM
|
|
|
|
request.h
|
|
_________
|
|
|
|
.. doxygenfile:: request.h
|
|
:project: TensorRT-LLM
|
|
|
|
decoderState.h
|
|
______________
|
|
|
|
.. doxygenfile:: decoderState.h
|
|
:project: TensorRT-LLM
|
|
|
|
ipcUtils.h
|
|
__________
|
|
|
|
.. doxygenfile:: ipcUtils.h
|
|
:project: TensorRT-LLM
|
|
|
|
memoryCounters.h
|
|
________________
|
|
|
|
.. doxygenfile:: memoryCounters.h
|
|
:project: TensorRT-LLM
|
|
|