From f2dd0ee128c491813c3667b2635d1c60b780df57 Mon Sep 17 00:00:00 2001 From: Liao Lanyu <108499334+lancelly@users.noreply.github.com> Date: Fri, 30 Jan 2026 16:06:48 +0800 Subject: [PATCH] [None][chore] Correct sorting order for attention DP scheduling to prioritize non-relaxed requests (#11106) Signed-off-by: Lance Liao <108499334+lancelly@users.noreply.github.com> --- tensorrt_llm/_torch/pyexecutor/executor_request_queue.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tensorrt_llm/_torch/pyexecutor/executor_request_queue.py b/tensorrt_llm/_torch/pyexecutor/executor_request_queue.py index d0442139cf..dd8633411c 100644 --- a/tensorrt_llm/_torch/pyexecutor/executor_request_queue.py +++ b/tensorrt_llm/_torch/pyexecutor/executor_request_queue.py @@ -445,7 +445,7 @@ class ExecutorRequestQueue: return True return scheduling_params.attention_dp_relax - new_requests = sorted(new_requests, key=get_relax_value, reverse=True) + new_requests = sorted(new_requests, key=get_relax_value) # Try to put the requests to the target dp rank until the max_num_active_requests is reached remaining_unscheduled = []