Skip to content

Commit 8cecd30

Browse files
authored
Update hpu_model_runner.py
1 parent b05a82b commit 8cecd30

File tree

1 file changed

+3
-2
lines changed

1 file changed

+3
-2
lines changed

vllm_gaudi/v1/worker/hpu_model_runner.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2591,7 +2591,8 @@ def warmup_model(self) -> None:
2591 2591
self.bucketing_manager.generate_prompt_buckets()
2592 2592
self.bucketing_manager.generate_decode_buckets()
2593 2593

2594-
if self.bucketing_manager.decode_buckets[-1][0] > self.input_batch.max_num_reqs:
2594+
max_bucket = max(self.bucketing_manager.decode_buckets[-1][0], self.bucketing_manager.prompt_buckets[-1][0])
2595+
if max_bucket > self.input_batch.max_num_reqs:
2595 2596
input_batch_bkp = self.input_batch
2596 2597
self.input_batch = InputBatch(
2597 2598
max_num_reqs=self.bucketing_manager.decode_buckets[-1][0],
@@ -2687,7 +2688,7 @@ def warmup_model(self) -> None:
2687 2688
logger.info(msg)
2688 2689
self.profiler.end()
2689 2690

2690-
if self.bucketing_manager.decode_buckets[-1][0] > self.input_batch.max_num_reqs:
2691+
if max_bucket > self.input_batch.max_num_reqs:
2691 2692
self.input_batch = input_batch_bkp
2692 2693

2693 2694
def shutdown_inc(self):

0 commit comments

Comments
 (0)