Runtime
==========

.. Here are the files in cpp/include/runtime
.. We manually add subsections to enable detailed descriptions in the future
.. It is also possible to generate this file automatically and list all the modules in conf.py

lookaheadBuffers.h
__________________

.. doxygenfile:: lookaheadBuffers.h
   :project: TensorRT-LLM

lookaheadModule.h
_________________

.. doxygenfile:: lookaheadModule.h
   :project: TensorRT-LLM

iBuffer.h
_________

.. doxygenfile:: iBuffer.h
   :project: TensorRT-LLM

modelConfig.h
_____________

.. doxygenfile:: modelConfig.h
   :project: TensorRT-LLM

decodingOutput.h
________________

.. doxygenfile:: decodingOutput.h
   :project: TensorRT-LLM

promptTuningParams.h
____________________

.. doxygenfile:: promptTuningParams.h
   :project: TensorRT-LLM

bufferManager.h
_______________

.. doxygenfile:: bufferManager.h
   :project: TensorRT-LLM

gptJsonConfig.h
_______________

.. doxygenfile:: gptJsonConfig.h
   :project: TensorRT-LLM

runtimeDefaults.h
_________________

.. doxygenfile:: runtimeDefaults.h
   :project: TensorRT-LLM

loraCache.h
___________

.. doxygenfile:: loraCache.h
   :project: TensorRT-LLM

rawEngine.h
___________

.. doxygenfile:: rawEngine.h
   :project: TensorRT-LLM

gptDecoder.h
____________

.. doxygenfile:: gptDecoder.h
   :project: TensorRT-LLM

eagleBuffers.h
______________

.. doxygenfile:: eagleBuffers.h
   :project: TensorRT-LLM

medusaModule.h
______________

.. doxygenfile:: medusaModule.h
   :project: TensorRT-LLM

explicitDraftTokensBuffers.h
____________________________

.. doxygenfile:: explicitDraftTokensBuffers.h
   :project: TensorRT-LLM

iTensor.h
_________

.. doxygenfile:: iTensor.h
   :project: TensorRT-LLM

common.h
________

.. doxygenfile:: common.h
   :project: TensorRT-LLM

loraCachePageManagerConfig.h
____________________________

.. doxygenfile:: loraCachePageManagerConfig.h
   :project: TensorRT-LLM

worldConfig.h
_____________

.. doxygenfile:: worldConfig.h
   :project: TensorRT-LLM

loraModule.h
____________

.. doxygenfile:: loraModule.h
   :project: TensorRT-LLM

speculativeDecodingMode.h
_________________________

.. doxygenfile:: speculativeDecodingMode.h
   :project: TensorRT-LLM

cudaEvent.h
___________

.. doxygenfile:: cudaEvent.h
   :project: TensorRT-LLM

decodingInput.h
_______________

.. doxygenfile:: decodingInput.h
   :project: TensorRT-LLM

speculativeDecodingModule.h
___________________________

.. doxygenfile:: speculativeDecodingModule.h
   :project: TensorRT-LLM

iGptDecoderBatched.h
____________________

.. doxygenfile:: iGptDecoderBatched.h
   :project: TensorRT-LLM

eagleModule.h
_____________

.. doxygenfile:: eagleModule.h
   :project: TensorRT-LLM

tllmLogger.h
____________

.. doxygenfile:: tllmLogger.h
   :project: TensorRT-LLM

gptDecoderBatched.h
___________________

.. doxygenfile:: gptDecoderBatched.h
   :project: TensorRT-LLM

cudaStream.h
____________

.. doxygenfile:: cudaStream.h
   :project: TensorRT-LLM

ipcNvlsMemory.h
_______________

.. doxygenfile:: ipcNvlsMemory.h
   :project: TensorRT-LLM

samplingConfig.h
________________

.. doxygenfile:: samplingConfig.h
   :project: TensorRT-LLM

request.h
_________

.. doxygenfile:: request.h
   :project: TensorRT-LLM

decoderState.h
______________

.. doxygenfile:: decoderState.h
   :project: TensorRT-LLM

ipcUtils.h
__________

.. doxygenfile:: ipcUtils.h
   :project: TensorRT-LLM

memoryCounters.h
________________

.. doxygenfile:: memoryCounters.h
   :project: TensorRT-LLM