mirror of
https://github.com/NVIDIA/TensorRT-LLM.git
synced 2026-01-14 06:27:45 +08:00
4 lines
70 B
YAML
4 lines
70 B
YAML
# Settings grouped under the cache transceiver section.
# NOTE(review): presumably read by TensorRT-LLM's disaggregated-serving
# config loader -- confirm against the consumer of this file.
cache_transceiver_config:
  # Backend identifier for the transceiver (value kept exactly as given).
  backend: UCX
  # Upper bound for the transceiver buffer; the key name indicates the unit
  # is tokens -- confirm against the upstream documentation.
  max_tokens_in_buffer: 2048