Runtime
==========

.. These are the files in cpp/include/runtime.
.. We manually add a subsection for each file to enable detailed descriptions in the future.
.. It is also possible to generate this file automatically and list all the modules in conf.py.

iStatefulGptDecoder.h
_____________________

.. doxygenfile:: iStatefulGptDecoder.h
   :project: TensorRT-LLM

lookaheadModule.h
_________________

.. doxygenfile:: lookaheadModule.h
   :project: TensorRT-LLM

iTensor.h
_________

.. doxygenfile:: iTensor.h
   :project: TensorRT-LLM

speculativeDecodingMode.h
_________________________

.. doxygenfile:: speculativeDecodingMode.h
   :project: TensorRT-LLM

eagleBuffers.h
______________

.. doxygenfile:: eagleBuffers.h
   :project: TensorRT-LLM

decodingInput.h
_______________

.. doxygenfile:: decodingInput.h
   :project: TensorRT-LLM

memoryCounters.h
________________

.. doxygenfile:: memoryCounters.h
   :project: TensorRT-LLM

gptDecoderBatched.h
___________________

.. doxygenfile:: gptDecoderBatched.h
   :project: TensorRT-LLM

rawEngine.h
___________

.. doxygenfile:: rawEngine.h
   :project: TensorRT-LLM

gptSession.h
____________

.. doxygenfile:: gptSession.h
   :project: TensorRT-LLM

decodingOutput.h
________________

.. doxygenfile:: decodingOutput.h
   :project: TensorRT-LLM

ipcUtils.h
__________

.. doxygenfile:: ipcUtils.h
   :project: TensorRT-LLM

iBuffer.h
_________

.. doxygenfile:: iBuffer.h
   :project: TensorRT-LLM

lookaheadBuffers.h
__________________

.. doxygenfile:: lookaheadBuffers.h
   :project: TensorRT-LLM

bufferManager.h
_______________

.. doxygenfile:: bufferManager.h
   :project: TensorRT-LLM

loraCachePageManagerConfig.h
____________________________

.. doxygenfile:: loraCachePageManagerConfig.h
   :project: TensorRT-LLM

loraCache.h
___________

.. doxygenfile:: loraCache.h
   :project: TensorRT-LLM

speculativeDecodingModule.h
___________________________

.. doxygenfile:: speculativeDecodingModule.h
   :project: TensorRT-LLM

cudaStream.h
____________

.. doxygenfile:: cudaStream.h
   :project: TensorRT-LLM

medusaModule.h
______________

.. doxygenfile:: medusaModule.h
   :project: TensorRT-LLM

common.h
________

.. doxygenfile:: common.h
   :project: TensorRT-LLM

samplingConfig.h
________________

.. doxygenfile:: samplingConfig.h
   :project: TensorRT-LLM

tllmLogger.h
____________

.. doxygenfile:: tllmLogger.h
   :project: TensorRT-LLM

loraModule.h
____________

.. doxygenfile:: loraModule.h
   :project: TensorRT-LLM

modelConfig.h
_____________

.. doxygenfile:: modelConfig.h
   :project: TensorRT-LLM

worldConfig.h
_____________

.. doxygenfile:: worldConfig.h
   :project: TensorRT-LLM

gptDecoder.h
____________

.. doxygenfile:: gptDecoder.h
   :project: TensorRT-LLM

generationOutput.h
__________________

.. doxygenfile:: generationOutput.h
   :project: TensorRT-LLM

promptTuningParams.h
____________________

.. doxygenfile:: promptTuningParams.h
   :project: TensorRT-LLM

runtimeDefaults.h
_________________

.. doxygenfile:: runtimeDefaults.h
   :project: TensorRT-LLM

generationInput.h
_________________

.. doxygenfile:: generationInput.h
   :project: TensorRT-LLM

request.h
_________

.. doxygenfile:: request.h
   :project: TensorRT-LLM

cudaEvent.h
___________

.. doxygenfile:: cudaEvent.h
   :project: TensorRT-LLM

explicitDraftTokensBuffers.h
____________________________

.. doxygenfile:: explicitDraftTokensBuffers.h
   :project: TensorRT-LLM

iGptDecoderBatched.h
____________________

.. doxygenfile:: iGptDecoderBatched.h
   :project: TensorRT-LLM

gptJsonConfig.h
_______________

.. doxygenfile:: gptJsonConfig.h
   :project: TensorRT-LLM