Runtime
==========

.. Here are the files in cpp/include/runtime.
.. We manually add a subsection for each file so that detailed descriptions can be added in the future.
.. It is also possible to generate this file automatically and list all the modules in conf.py.

gptJsonConfig.h
_______________

.. doxygenfile:: gptJsonConfig.h
   :project: TensorRT-LLM

tllmLogger.h
____________

.. doxygenfile:: tllmLogger.h
   :project: TensorRT-LLM

worldConfig.h
_____________

.. doxygenfile:: worldConfig.h
   :project: TensorRT-LLM

common.h
________

.. doxygenfile:: common.h
   :project: TensorRT-LLM

ipcUtils.h
__________

.. doxygenfile:: ipcUtils.h
   :project: TensorRT-LLM

iGptDecoderBatched.h
____________________

.. doxygenfile:: iGptDecoderBatched.h
   :project: TensorRT-LLM

eagleBuffers.h
______________

.. doxygenfile:: eagleBuffers.h
   :project: TensorRT-LLM

samplingConfig.h
________________

.. doxygenfile:: samplingConfig.h
   :project: TensorRT-LLM

speculativeDecodingMode.h
_________________________

.. doxygenfile:: speculativeDecodingMode.h
   :project: TensorRT-LLM

memoryCounters.h
________________

.. doxygenfile:: memoryCounters.h
   :project: TensorRT-LLM

runtimeDefaults.h
_________________

.. doxygenfile:: runtimeDefaults.h
   :project: TensorRT-LLM

decodingOutput.h
________________

.. doxygenfile:: decodingOutput.h
   :project: TensorRT-LLM

decoderState.h
______________

.. doxygenfile:: decoderState.h
   :project: TensorRT-LLM

gptDecoder.h
____________

.. doxygenfile:: gptDecoder.h
   :project: TensorRT-LLM

explicitDraftTokensBuffers.h
____________________________

.. doxygenfile:: explicitDraftTokensBuffers.h
   :project: TensorRT-LLM

decodingInput.h
_______________

.. doxygenfile:: decodingInput.h
   :project: TensorRT-LLM

lookaheadModule.h
_________________

.. doxygenfile:: lookaheadModule.h
   :project: TensorRT-LLM

bufferManager.h
_______________

.. doxygenfile:: bufferManager.h
   :project: TensorRT-LLM

rawEngine.h
___________

.. doxygenfile:: rawEngine.h
   :project: TensorRT-LLM

loraModule.h
____________

.. doxygenfile:: loraModule.h
   :project: TensorRT-LLM

request.h
_________

.. doxygenfile:: request.h
   :project: TensorRT-LLM

cudaStream.h
____________

.. doxygenfile:: cudaStream.h
   :project: TensorRT-LLM

cudaEvent.h
___________

.. doxygenfile:: cudaEvent.h
   :project: TensorRT-LLM

modelConfig.h
_____________

.. doxygenfile:: modelConfig.h
   :project: TensorRT-LLM

ipcNvlsMemory.h
_______________

.. doxygenfile:: ipcNvlsMemory.h
   :project: TensorRT-LLM

iTensor.h
_________

.. doxygenfile:: iTensor.h
   :project: TensorRT-LLM

gptDecoderBatched.h
___________________

.. doxygenfile:: gptDecoderBatched.h
   :project: TensorRT-LLM

eagleModule.h
_____________

.. doxygenfile:: eagleModule.h
   :project: TensorRT-LLM

loraCache.h
___________

.. doxygenfile:: loraCache.h
   :project: TensorRT-LLM

loraCachePageManagerConfig.h
____________________________

.. doxygenfile:: loraCachePageManagerConfig.h
   :project: TensorRT-LLM

speculativeDecodingModule.h
___________________________

.. doxygenfile:: speculativeDecodingModule.h
   :project: TensorRT-LLM

lookaheadBuffers.h
__________________

.. doxygenfile:: lookaheadBuffers.h
   :project: TensorRT-LLM

promptTuningParams.h
____________________

.. doxygenfile:: promptTuningParams.h
   :project: TensorRT-LLM

medusaModule.h
______________

.. doxygenfile:: medusaModule.h
   :project: TensorRT-LLM

iBuffer.h
_________

.. doxygenfile:: iBuffer.h
   :project: TensorRT-LLM