Skip to content

Commit d01a546

Browse files
ShunkangShunkang
authored and committed
Refactor test
Signed-off-by: Shunkang <[email protected]>
1 parent 8b4a728 commit d01a546

File tree

2 files changed

+388
-438
lines changed

2 files changed

+388
-438
lines changed

tensorrt_llm/_torch/pyexecutor/executor_request_queue.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -293,6 +293,8 @@ def _filter_out_unschedulable_requests(
293293
unscheduled_requests.append(req_item)
294294
else:
295295
pending_requests.append(req_item)
296+
else:
297+
unscheduled_requests.append(req_item)
296298
else:
297299
unscheduled_requests.append(req_item)
298300

@@ -312,7 +314,7 @@ def _schedule_attention_dp_requests(
312314
# Schedule the requests with attention dp rank and no relax
313315
for req_item in scheduled_requests:
314316
target_dp_rank = req_item.request.py_schedule_params.attention_dp_rank
315-
assert self.all_ranks_num_active_requests[target_dp_rank] < self.max_num_active_requests, \
317+
assert self.all_ranks_num_active_requests[target_dp_rank] <= self.max_num_active_requests, \
316318
f"The number of active requests on rank {target_dp_rank} is {self.all_ranks_num_active_requests[target_dp_rank]}, " \
317319
f"which is greater than the max_num_active_requests {self.max_num_active_requests}"
318320
self.all_ranks_num_active_requests[target_dp_rank] += 1

0 commit comments

Comments
 (0)