TensorRT-LLMs/tests/integration/defs/disaggregated/test_configs
2026-02-02 09:54:33 +08:00
..
disagg_config_cache_aware_balance_deepseek_v3.yaml
disagg_config_cache_aware_balance.yaml
disagg_config_cache_reuse_deepseek_v3.yaml
disagg_config_cache_reuse.yaml
disagg_config_cancel_stress_test_large.yaml
disagg_config_cancel_stress_test.yaml
disagg_config_conditional_deepseek_v3.yaml
disagg_config_conditional.yaml
disagg_config_ctxpp2_genpp2.yaml
disagg_config_ctxpp2_gentp2.yaml
disagg_config_ctxpp4_genpp4.yaml
disagg_config_ctxpp4_gentp4.yaml
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_one_mtp_attention_dp_overlap.yaml
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_one_mtp_ctxpp2_gentp2.yaml
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_one_mtp.yaml
disagg_config_ctxtp1_gentp1_deepseek_v3_lite_two_mtp.yaml
disagg_config_ctxtp1_gentp1_deepseek_v3_lite.yaml
disagg_config_ctxtp2_genpp2.yaml
disagg_config_ctxtp2_gentp1_trt_backend.yaml
disagg_config_ctxtp2_gentp1.yaml
disagg_config_ctxtp2_gentp1cp2_deepseek_v3_lite_bf16_tllm_gen.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_one_mtp.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_one.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_overlap_cuda_graph.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp_overlap.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_attention_dp.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_mpi.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_nixl.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_overlap_cuda_graph.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite_ucx.yaml
disagg_config_ctxtp2_gentp2_deepseek_v3_lite.yaml
disagg_config_ctxtp2_gentp2_gptoss_tllm.yaml
disagg_config_ctxtp2pp2_gentp2pp2.yaml
disagg_config_ctxtp4_gentp4_deepseek_r1_v2_fp4_tllm.yaml
disagg_config_cuda_graph_padding.yaml
disagg_config_deepseek_v3_lite_empty_batch.yaml
disagg_config_diff_max_tokens.yaml
disagg_config_gen_only_bs1.yaml
disagg_config_gen_only_trt_backend.yaml
disagg_config_gen_only.yaml
disagg_config_llama4_kv_cache_overflow.yaml
disagg_config_load_balance.yaml
disagg_config_metrics.yaml
disagg_config_mixed.yaml [https://nvbugs/5834212][fix] prevent routing ctx and gen requests to the same worker; update doc for unique disagg ID (#11095) 2026-02-02 09:54:33 +08:00
disagg_config_ngram.yaml
disagg_config_overlap.yaml
disagg_config_trt_backend.yaml
disagg_config_trtllm_sampler.yaml