| .. |
|
disagg_config_cache_aware_balance_deepseek_v3.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_cache_aware_balance.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_cache_reuse_deepseek_v3.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_cache_reuse.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_conditional_deepseek_v3.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_conditional.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxpp2_genpp2.yaml
|
feat: Add support for disaggregation with pp with pytorch backend (#6369)
|
2025-07-30 09:42:13 -04:00 |
|
disagg_config_ctxpp2_gentp2.yaml
|
feat: Add support for disaggregation with pp with pytorch backend (#6369)
|
2025-07-30 09:42:13 -04:00 |
|
disagg_config_ctxpp4_genpp4.yaml
|
feat: Add support for disaggregation with pp with pytorch backend (#6369)
|
2025-07-30 09:42:13 -04:00 |
|
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_one_mtp_attention_dp_overlap.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_one_mtp.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_two_mtp.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp1_gentp1_deepseek_v3_lite.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_genpp2.yaml
|
feat: Add support for disaggregation with pp with pytorch backend (#6369)
|
2025-07-30 09:42:13 -04:00 |
|
disagg_config_ctxtp2_gentp1_trt_backend.yaml
|
[BREAKING CHANGE]: change default backend to PyTorch in trtllm-serve (#5717)
|
2025-07-21 21:09:43 +08:00 |
|
disagg_config_ctxtp2_gentp1.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_one_mtp.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_one.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_overlap_cuda_graph.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_overlap.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_mpi.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_nixl.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_overlap_cuda_graph.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_ucx.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2_gentp2_deepseek_v3_lite.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ctxtp2pp2_gentp2pp2.yaml
|
feat: Add support for disaggregation with pp with pytorch backend (#6369)
|
2025-07-30 09:42:13 -04:00 |
|
disagg_config_cuda_graph_padding.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_gen_only_trt_backend.yaml
|
[BREAKING CHANGE]: change default backend to PyTorch in trtllm-serve (#5717)
|
2025-07-21 21:09:43 +08:00 |
|
disagg_config_gen_only.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_load_balance.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_mixed.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_ngram.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_overlap.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |
|
disagg_config_trt_backend.yaml
|
[BREAKING CHANGE]: change default backend to PyTorch in trtllm-serve (#5717)
|
2025-07-21 21:09:43 +08:00 |
|
disagg_config_trtllm_sampler.yaml
|
chore:[BREAKING CHANGE] use cacheTransceiverConfig as knobs for disagg service (#5234)
|
2025-07-17 17:42:07 +08:00 |