Skip to content

Commit 4a09d88

Browse files
committed
[https://nvbugs/5448437,https://nvbugs/5448449][fix] fix some nixl tests
Signed-off-by: Bo Deng <[email protected]>
1 parent a32a2e4 commit 4a09d88

File tree

4 files changed: +10 / -11 lines changed

4 files changed: +10 / -11 lines changed

tests/integration/defs/accuracy/test_disaggregated_serving.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
2121
from tensorrt_llm.llmapi.llm_args import LlmArgs
2222

2323
from ..conftest import (get_device_count, llm_models_root, parametrize_with_ids,
24-
skip_pre_hopper)
24+
skip_no_hopper, skip_pre_hopper)
2525
from ..trt_test_alternative import popen
2626
from .accuracy_core import (GSM8K, MMLU, LlmapiAccuracyTestHarness,
2727
get_accuracy_task)
@@ -503,6 +503,7 @@ class TestDeepSeekV3Lite(LlmapiAccuracyTestHarness):
503503
MODEL_NAME = "deepseek-ai/DeepSeek-V3-Lite"
504504
MODEL_PATH = f"{llm_models_root()}/DeepSeek-V3-Lite/bf16"
505505

506+
@skip_no_hopper
506507
def test_nixl_backend(self):
507508
ctx_server_config = {
508509
"disable_overlap_scheduler": True,
@@ -634,6 +635,7 @@ class TestQwen3_8B(LlmapiAccuracyTestHarness):
634635
MODEL_NAME = "Qwen3/Qwen3-8B"
635636
MODEL_PATH = f"{llm_models_root()}/Qwen3/Qwen3-8B-FP8"
636637

638+
@skip_no_hopper
637639
def test_nixl_backend(self):
638640
ctx_server_config = {
639641
"disable_overlap_scheduler": True,
@@ -665,8 +667,6 @@ def test_nixl_backend(self):
665667
with launch_disaggregated_llm(disaggregated_server_config,
666668
ctx_server_config, gen_server_config,
667669
self.MODEL_PATH) as llm:
668-
task = MMLU(self.MODEL_NAME)
669-
task.evaluate(llm)
670670
task = GSM8K(self.MODEL_NAME)
671671
task.evaluate(llm)
672672

tests/integration/defs/disaggregated/test_disaggregated.py

Lines changed: 7 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,8 @@
2020

2121
import pytest
2222
import yaml
23-
from defs.conftest import llm_models_root, skip_arm, skip_no_hopper
23+
from defs.conftest import (get_sm_version, llm_models_root, skip_arm,
24+
skip_no_hopper)
2425
from defs.trt_test_alternative import check_call, check_output, popen
2526

2627
from tensorrt_llm.logger import logger
@@ -1212,7 +1213,7 @@ def get_config_for_benchmark(model_root, backend):
12121213
"num_instances": 1,
12131214
"max_batch_size": 2,
12141215
"max_num_tokens": 384,
1215-
"max_seq_len": 320,
1216+
"max_seq_len": 384,
12161217
"tensor_parallel_size": 1,
12171218
"pipeline_parallel_size": 1,
12181219
"disable_overlap_scheduler": True,
@@ -1228,7 +1229,7 @@ def get_config_for_benchmark(model_root, backend):
12281229
"pipeline_parallel_size": 1,
12291230
"max_batch_size": 2,
12301231
"max_num_tokens": 384,
1231-
"max_seq_len": 320,
1232+
"max_seq_len": 384,
12321233
"cache_transceiver_config": {
12331234
"backend": backend,
12341235
"max_tokens_in_buffer": 512,
@@ -1247,6 +1248,9 @@ def get_config_for_benchmark(model_root, backend):
12471248
def test_disaggregated_benchmark_on_diff_backends(
12481249
disaggregated_test_root, disaggregated_example_root, llm_venv,
12491250
benchmark_model_root, benchmark_root, shared_gpt_path):
1251+
if "DeepSeek-V3-Lite" in benchmark_model_root and "fp8" in benchmark_model_root and get_sm_version(
1252+
) != 90:
1253+
pytest.skip("The test should only run on Hopper")
12501254
nixl_config = get_config_for_benchmark(benchmark_model_root, "nixl")
12511255
ucx_config = get_config_for_benchmark(benchmark_model_root, "ucx")
12521256
temp_dir = tempfile.TemporaryDirectory()

tests/integration/test_lists/test-db/l0_dgx_b200.yml

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -72,6 +72,3 @@ l0_dgx_b200:
7272
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[DeepSeek-V3-Lite-bf16]
7373
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[llama-v3-8b-hf]
7474
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[llama-3.1-8b-instruct-hf-fp8]
75-
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[DeepSeek-V3-Lite-fp8]
76-
- accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend
77-
- accuracy/test_disaggregated_serving.py::TestDeepSeekV3Lite::test_nixl_backend

tests/integration/test_lists/waives.txt

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -284,6 +284,4 @@ examples/test_gemma.py::test_hf_gemma_fp8_base_bf16_multi_lora[gemma-2-27b-it] S
284284
examples/test_gemma.py::test_hf_gemma_fp8_base_bf16_multi_lora[gemma-3-1b-it] SKIP (https://nvbugs/5434451)
285285
accuracy/test_llm_api_pytorch.py::TestQwen3_235B_A22B::test_nvfp4[latency_moe_trtllm_eagle3] SKIP (https://nvbugs/5437384)
286286
accuracy/test_llm_api_pytorch.py::TestGemma3_27BInstruct::test_fp8_prequantized SKIP (https://nvbugs/5445774)
287-
accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend SKIP (https://nvbugs/5448437)
288-
disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[DeepSeek-V3-Lite-fp8] SKIP (https://nvbugs/5448449)
289287
test_e2e.py::test_ptp_quickstart_multimodal[llava-v1.6-mistral-7b-llava-v1.6-mistral-7b-hf-image-False] SKIP (https://nvbugs/5444095)

0 commit comments

Comments
 (0)