TensorRT-LLMs

mirror of https://github.com/NVIDIA/TensorRT-LLM.git synced 2026-01-27 22:23:25 +08:00

History

Jonas Yang CN 88ea2c4ee9 [TRTLLM-7349][feat] Adding new orchestrator type -- ray (#7520 ) Signed-off-by: Erin Ho <14718778+hchings@users.noreply.github.com> Co-authored-by: Yuan Tong <13075180+tongyuantongyu@users.noreply.github.com> Co-authored-by: Erin Ho <14718778+hchings@users.noreply.github.com>		2025-10-04 08:12:24 +08:00
..
utils	[TRTLLM-7349][feat] Adding new orchestrator type -- ray (#7520 )	2025-10-04 08:12:24 +08:00
bufferManager.h
common.h	[TRTLLM-7398][feat] Support KV cache salting for secure KV cache reuse (#7106 )	2025-09-06 17:58:32 -04:00
cudaEvent.h
cudaStream.h
decoderState.h	[None][refactor] Simplify decoder state initialization (#6559 )	2025-08-12 21:44:41 +02:00
decodingInput.h	[None][refactor] Simplify decoder state initialization for speculative decoding (#6869 )	2025-08-22 18:44:17 +02:00
decodingOutput.h
eagleBuffers.h
eagleModule.h
explicitDraftTokensBuffers.h
gptDecoder.h	[TRTLLM-6785][feat] BREAKING CHANGE Enable TRTLLM sampler by default (#6216 )	2025-08-07 22:19:37 -04:00
gptDecoderBatched.h	[TRTLLM-6785][feat] BREAKING CHANGE Enable TRTLLM sampler by default (#6216 )	2025-08-07 22:19:37 -04:00
gptJsonConfig.h
iBuffer.h
iGptDecoderBatched.h	[TRTLLM-6785][feat] BREAKING CHANGE Enable TRTLLM sampler by default (#6216 )	2025-08-07 22:19:37 -04:00
ipcNvlsMemory.h
ipcUtils.h
iTensor.h
lookaheadBuffers.h
lookaheadModule.h	[None] [refactor] Minor cleanup and improvements (#7619 )	2025-10-03 11:40:06 +02:00
loraCache.h
loraCachePageManagerConfig.h
loraModule.h
medusaModule.h
memoryCounters.h
modelConfig.h	[None] [refactor] Minor cleanup and improvements (#7619 )	2025-10-03 11:40:06 +02:00
promptTuningParams.h
rawEngine.h
runtimeDefaults.h
samplingConfig.h
speculativeDecodingMode.h
speculativeDecodingModule.h
tllmLogger.h
virtualMemory.h	[TRTLLM-4406][feat] LLM sleep & wakeup Part 1: virtual device memory (#5034 )	2025-08-04 13:51:01 +08:00
worldConfig.h