Skip to content

Commit b0de043

Browse files
committed
fix ci
Signed-off-by: MengqingCao <[email protected]>
1 parent 54582c7 commit b0de043

File tree

3 files changed

+10
-8
lines changed

3 files changed

+10
-8
lines changed

.github/workflows/vllm_ascend_test.yaml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -40,8 +40,8 @@ concurrency:
4040
cancel-in-progress: true
4141

4242
jobs:
43-
# lint:
44-
# uses: ./.github/workflows/pre-commit.yml
43+
lint:
44+
uses: ./.github/workflows/pre-commit.yml
4545

4646
changes:
4747
runs-on: ubuntu-latest

tests/e2e/singlecard/sample/test_rejection_sampler.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@
44
import pytest
55
import torch
66
import torch.nn.functional as F
7-
from vllm.v1.sample.logits_processor import LogitsProcessorManager
7+
from vllm.v1.sample.logits_processor import LogitsProcessors
88
from vllm.v1.sample.metadata import SamplingMetadata
99
from vllm.v1.spec_decode.metadata import SpecDecodeMetadata
1010

@@ -66,7 +66,7 @@ def create_sampling_metadata(
6666
output_token_ids=[],
6767
allowed_token_ids_mask=None,
6868
bad_words_token_ids={},
69-
logitsprocs=LogitsProcessorManager())
69+
logitsprocs=LogitsProcessors())
7070

7171

7272
########################### Tests for Greedy Sampling ###################

vllm_ascend/worker/model_runner_v1.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -1074,8 +1074,8 @@ def _process_reqs(
10741074
num_input_tokens)
10751075
num_input_tokens += num_pad
10761076

1077-
modified_batch = self.attn_metadata_builder.reorder_batch(
1078-
self.input_batch, scheduler_output)
1077+
self.attn_metadata_builder.reorder_batch(self.input_batch,
1078+
scheduler_output)
10791079
# OPTIMIZATION: Start copying the block table first.
10801080
# This way, we can overlap the copy with the following CPU operations.
10811081
self.input_batch.block_table.commit_block_table(num_reqs)
@@ -2482,10 +2482,12 @@ def _capture_aclgraphs(self, compilation_cases: list[int],
24822482
self._dummy_run(num_tokens,
24832483
aclgraph_runtime_mode=CUDAGraphMode.NONE,
24842484
force_attention=force_attention,
2485-
uniform_decode=uniform_decode)
2485+
uniform_decode=uniform_decode,
2486+
moe_comm_method=self.moe_comm_method)
24862487
self._dummy_run(num_tokens,
24872488
aclgraph_runtime_mode=aclgraph_runtime_mode,
2488-
uniform_decode=uniform_decode)
2489+
uniform_decode=uniform_decode,
2490+
moe_comm_method=self.moe_comm_method)
24892491

24902492
def _capture_model(self):
24912493
if not self.use_aclgraph:

0 commit comments

Comments
 (0)