| .. |
|
allocateKvCache.h
|
Update TensorRT-LLM (#2792)
|
2025-02-18 21:27:39 +08:00 |
|
assignReqSeqSlots.h
|
Update TensorRT-LLM (#2436)
|
2024-11-12 15:27:49 +08:00 |
|
cacheTransceiver.h
|
[TRTLLM-8540][feat] Add support for disagg in DSv3.2 (#8735)
|
2025-11-12 08:21:11 -08:00 |
|
capacityScheduler.h
|
fix: max_num_sequences calculation with overlap scheduling (#4532)
|
2025-06-03 09:31:22 +02:00 |
|
common.h
|
open source 4dbf696ae9b74a26829d120b67ab8443d70c8e58 (#2297)
|
2024-10-08 12:19:19 +02:00 |
|
contextProgress.h
|
Update TensorRT-LLM (#2413)
|
2024-11-05 16:27:06 +08:00 |
|
createNewDecoderRequests.h
|
[None] [refactor] Minor cleanup and improvements (#7619)
|
2025-10-03 11:40:06 +02:00 |
|
decoderBuffers.h
|
[None][refactor] decoding inputs, part 2 (#5799)
|
2025-11-18 14:38:51 +01:00 |
|
evictionPolicy.h
|
[TLLM-6777][feature] Support SWA KV cache reuse OOW block detach (#7922)
|
2025-10-13 09:18:12 -07:00 |
|
guidedDecoder.h
|
refactor: Enhanced handling of decoder requests and logits within the batch manager (#6055)
|
2025-07-18 12:12:08 +02:00 |
|
handleContextLogits.h
|
refactor: Speculative decoding buffers part 2 (#5316)
|
2025-06-27 17:41:48 +02:00 |
|
handleGenerationLogits.h
|
refactor: Speculative decoding buffers part 2 (#5316)
|
2025-06-27 17:41:48 +02:00 |
|
kvCacheConnector.h
|
[None][feat] KV Cache Connector API (#7228)
|
2025-08-28 23:09:27 -04:00 |
|
kvCacheEventManager.h
|
[TRTLLM-6881][feat] Include attention dp rank info with KV cache events (#6563)
|
2025-08-07 14:17:07 +02:00 |
|
kvCacheManager.h
|
[https://nvbugs/5689235][fix] Fix cancellation+chunked prefill+disagg (#10111)
|
2026-01-12 18:23:26 -05:00 |
|
kvCacheTransferManager.h
|
[https://nvbugs/5627710][fix] Fix synchronization bugs in KvCacheTransferManager that can cause corrupted blocks (#9056)
|
2025-12-02 09:10:21 -06:00 |
|
kvCacheType.h
|
refactor: remove batch_manager::KvCacheConfig and use executor::KvCacheConfig instead (#5384)
|
2025-06-26 19:45:52 +08:00 |
|
kvCacheUtils.h
|
[None][feat] Add support for KVCache reuse for DSv32 (#9383)
|
2025-12-02 11:14:30 +08:00 |
|
llmRequest.h
|
[https://nvbugs/5689235][fix] Fix cancellation+chunked prefill+disagg (#10111)
|
2026-01-12 18:23:26 -05:00 |
|
logitsPostProcessor.h
|
[None][chore] Mass integration of release/1.0 - 3rd (#7519)
|
2025-09-08 14:03:04 +08:00 |
|
makeDecodingBatchInputOutput.h
|
[None][refactor] decoding inputs, part 2 (#5799)
|
2025-11-18 14:38:51 +01:00 |
|
medusaBuffers.h
|
Update TensorRT-LLM (#2873)
|
2025-03-11 21:13:42 +08:00 |
|
microBatchScheduler.h
|
[TRTLLM-3429] feat: Overlap scheduling in C++ runtime (#3625)
|
2025-05-06 15:06:46 +02:00 |
|
pauseRequests.h
|
Update TensorRT-LLM (#2532)
|
2024-12-04 21:16:56 +08:00 |
|
peftCacheManager.h
|
Update TensorRT-LLM (#2783)
|
2025-02-13 18:40:22 +08:00 |
|
peftCacheManagerConfig.h
|
Update TensorRT-LLM (#2755)
|
2025-02-11 03:01:00 +00:00 |
|
promptTuningBuffers.h
|
feat: Offloading Multimodal embedding table to CPU in Chunked Prefill Mode (#3380)
|
2025-04-21 14:31:01 +08:00 |
|
rnnStateManager.h
|
Update TensorRT-LLM (#2413)
|
2024-11-05 16:27:06 +08:00 |
|
runtimeBuffers.h
|
Revert "feat: nanobind bindings (#5961)" (#6160)
|
2025-07-18 10:12:54 +08:00 |
|
sequenceSlotManager.h
|
Update TensorRT-LLM (#2413)
|
2024-11-05 16:27:06 +08:00 |
|
transformerBuffers.h
|
refactor: remove batch_manager::KvCacheConfig and use executor::KvCacheConfig instead (#5384)
|
2025-06-26 19:45:52 +08:00 |
|
updateDecoderBuffers.h
|
refactor: Speculative decoding buffers part 2 (#5316)
|
2025-06-27 17:41:48 +02:00 |