Runtime
==========

..
   These are the header files in cpp/include/runtime.
   Subsections are added manually so that detailed descriptions can be added in the future.
   It is also possible to generate this file automatically and list all the modules in conf.py.

lookaheadBuffers.h
__________________

.. doxygenfile:: lookaheadBuffers.h
   :project: TensorRT-LLM

lookaheadModule.h
_________________

.. doxygenfile:: lookaheadModule.h
   :project: TensorRT-LLM

iBuffer.h
_________

.. doxygenfile:: iBuffer.h
   :project: TensorRT-LLM

modelConfig.h
_____________

.. doxygenfile:: modelConfig.h
   :project: TensorRT-LLM

iStatefulGptDecoder.h
_____________________

.. doxygenfile:: iStatefulGptDecoder.h
   :project: TensorRT-LLM

generationInput.h
_________________

.. doxygenfile:: generationInput.h
   :project: TensorRT-LLM

gptSession.h
____________

.. doxygenfile:: gptSession.h
   :project: TensorRT-LLM

decodingOutput.h
________________

.. doxygenfile:: decodingOutput.h
   :project: TensorRT-LLM

promptTuningParams.h
____________________

.. doxygenfile:: promptTuningParams.h
   :project: TensorRT-LLM

bufferManager.h
_______________

.. doxygenfile:: bufferManager.h
   :project: TensorRT-LLM

gptJsonConfig.h
_______________

.. doxygenfile:: gptJsonConfig.h
   :project: TensorRT-LLM

runtimeDefaults.h
_________________

.. doxygenfile:: runtimeDefaults.h
   :project: TensorRT-LLM

loraCache.h
___________

.. doxygenfile:: loraCache.h
   :project: TensorRT-LLM

rawEngine.h
___________

.. doxygenfile:: rawEngine.h
   :project: TensorRT-LLM

gptDecoder.h
____________

.. doxygenfile:: gptDecoder.h
   :project: TensorRT-LLM

eagleBuffers.h
______________

.. doxygenfile:: eagleBuffers.h
   :project: TensorRT-LLM

medusaModule.h
______________

.. doxygenfile:: medusaModule.h
   :project: TensorRT-LLM

explicitDraftTokensBuffers.h
____________________________

.. doxygenfile:: explicitDraftTokensBuffers.h
   :project: TensorRT-LLM

iTensor.h
_________

.. doxygenfile:: iTensor.h
   :project: TensorRT-LLM

common.h
________

.. doxygenfile:: common.h
   :project: TensorRT-LLM

loraCachePageManagerConfig.h
____________________________

.. doxygenfile:: loraCachePageManagerConfig.h
   :project: TensorRT-LLM

worldConfig.h
_____________

.. doxygenfile:: worldConfig.h
   :project: TensorRT-LLM

loraModule.h
____________

.. doxygenfile:: loraModule.h
   :project: TensorRT-LLM

speculativeDecodingMode.h
_________________________

.. doxygenfile:: speculativeDecodingMode.h
   :project: TensorRT-LLM

cudaEvent.h
___________

.. doxygenfile:: cudaEvent.h
   :project: TensorRT-LLM

decodingInput.h
_______________

.. doxygenfile:: decodingInput.h
   :project: TensorRT-LLM

speculativeDecodingModule.h
___________________________

.. doxygenfile:: speculativeDecodingModule.h
   :project: TensorRT-LLM

iGptDecoderBatched.h
____________________

.. doxygenfile:: iGptDecoderBatched.h
   :project: TensorRT-LLM

tllmLogger.h
____________

.. doxygenfile:: tllmLogger.h
   :project: TensorRT-LLM

gptDecoderBatched.h
___________________

.. doxygenfile:: gptDecoderBatched.h
   :project: TensorRT-LLM

cudaStream.h
____________

.. doxygenfile:: cudaStream.h
   :project: TensorRT-LLM

samplingConfig.h
________________

.. doxygenfile:: samplingConfig.h
   :project: TensorRT-LLM

request.h
_________

.. doxygenfile:: request.h
   :project: TensorRT-LLM

generationOutput.h
__________________

.. doxygenfile:: generationOutput.h
   :project: TensorRT-LLM

ipcUtils.h
__________

.. doxygenfile:: ipcUtils.h
   :project: TensorRT-LLM

memoryCounters.h
________________

.. doxygenfile:: memoryCounters.h
   :project: TensorRT-LLM