Skip to content

Commit fc977d3

Browse files
committed
[https://nvbugs/5448437][fix] fix some nixl tests (NVIDIA#6940)
Signed-off-by: Bo Deng <[email protected]>
1 parent 92daec1 commit fc977d3

File tree

4 files changed

+11
-9
lines changed

4 files changed

+11
-9
lines changed

tests/integration/defs/accuracy/test_disaggregated_serving.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@
2323
from tensorrt_llm.llmapi.tokenizer import load_hf_tokenizer
2424

2525
from ..conftest import (get_device_count, llm_models_root, parametrize_with_ids,
26-
skip_pre_blackwell, skip_pre_hopper)
26+
skip_no_hopper, skip_pre_blackwell, skip_pre_hopper)
2727
from ..trt_test_alternative import popen
2828
from .accuracy_core import (GSM8K, MMLU, JsonModeEval,
2929
LlmapiAccuracyTestHarness, get_accuracy_task)
@@ -590,6 +590,9 @@ class TestDeepSeekV3Lite(LlmapiAccuracyTestHarness):
590590
MODEL_NAME = "deepseek-ai/DeepSeek-V3-Lite"
591591
MODEL_PATH = f"{llm_models_root()}/DeepSeek-V3-Lite/bf16"
592592

593+
@pytest.mark.skip_less_device(2)
594+
@pytest.mark.skip_less_device_memory(60000)
595+
@skip_no_hopper
593596
def test_nixl_backend(self):
594597
ctx_server_config = {
595598
"disable_overlap_scheduler": True,
@@ -726,6 +729,8 @@ class TestQwen3_8B(LlmapiAccuracyTestHarness):
726729
MODEL_NAME = "Qwen3/Qwen3-8B"
727730
MODEL_PATH = f"{llm_models_root()}/Qwen3/Qwen3-8B-FP8"
728731

732+
@pytest.mark.skip_less_device(2)
733+
@skip_no_hopper
729734
def test_nixl_backend(self):
730735
ctx_server_config = {
731736
"disable_overlap_scheduler": True,
@@ -755,8 +760,6 @@ def test_nixl_backend(self):
755760
with launch_disaggregated_llm(disaggregated_server_config,
756761
ctx_server_config, gen_server_config,
757762
self.MODEL_PATH) as llm:
758-
task = MMLU(self.MODEL_NAME)
759-
task.evaluate(llm)
760763
task = GSM8K(self.MODEL_NAME)
761764
task.evaluate(llm)
762765

tests/integration/defs/disaggregated/test_disaggregated.py

Lines changed: 5 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,8 @@
2020

2121
import pytest
2222
import yaml
23-
from defs.conftest import llm_models_root, skip_arm, skip_no_hopper
23+
from defs.conftest import (get_sm_version, llm_models_root, skip_arm,
24+
skip_no_hopper)
2425
from defs.trt_test_alternative import check_call, check_output, popen
2526

2627
from tensorrt_llm.logger import logger
@@ -1270,6 +1271,9 @@ def get_config_for_benchmark(model_root, backend):
12701271
def test_disaggregated_benchmark_on_diff_backends(
12711272
disaggregated_test_root, disaggregated_example_root, llm_venv,
12721273
benchmark_model_root, benchmark_root, shared_gpt_path):
1274+
if "DeepSeek-V3-Lite" in benchmark_model_root and "fp8" in benchmark_model_root and get_sm_version(
1275+
) != 90:
1276+
pytest.skip("The test should only run on Hopper")
12731277
nixl_config = get_config_for_benchmark(benchmark_model_root, "NIXL")
12741278
ucx_config = get_config_for_benchmark(benchmark_model_root, "UCX")
12751279
temp_dir = tempfile.TemporaryDirectory()

tests/integration/test_lists/test-db/l0_dgx_b200.yml

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -86,6 +86,3 @@ l0_dgx_b200:
8686
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[DeepSeek-V3-Lite-bf16]
8787
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[llama-v3-8b-hf]
8888
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[llama-3.1-8b-instruct-hf-fp8]
89-
- disaggregated/test_disaggregated.py::test_disaggregated_benchmark_on_diff_backends[DeepSeek-V3-Lite-fp8]
90-
- accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend
91-
- accuracy/test_disaggregated_serving.py::TestDeepSeekV3Lite::test_nixl_backend

tests/integration/test_lists/waives.txt

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -302,8 +302,6 @@ triton_server/test_triton.py::test_mistral_ib_mm[mistral-ib-mm] SKIP (https://nv
302302
triton_server/test_triton.py::test_t5_ib[t5-ib] SKIP (https://nvbugs/5456482)
303303
triton_server/test_triton_llm.py::test_gpt_speculative_decoding_bls[False-False-1---False-True-True-0-128-disableDecoupleMode-inflight_fused_batching-disableTrtOverlap-0.2-guaranteed_no_evict---1-1-1-False-ensemble] SKIP (https://nvbugs/5456485)
304304
accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[GSM8K-gen_tp=1-ctx_pp=4] SKIP (https://nvbugs/5434320)
305-
accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend SKIP (https://nvbugs/5448437)
306-
accuracy/test_disaggregated_serving.py::TestDeepSeekV3Lite::test_nixl_backend SKIP (https://nvbugs/5448437)
307305
accuracy/test_llm_api_pytorch.py::TestDeepSeekR1::test_nvfp4_multi_gpus[latency_trtllmgen] SKIP (https://nvbugs/5445466)
308306
accuracy/test_llm_api_pytorch.py::TestDeepSeekR1::test_nvfp4_multi_gpus[latency] SKIP (https://nvbugs/5445466)
309307
test_e2e.py::test_ptp_quickstart_multimodal[mistral-small-3.1-24b-instruct-Mistral-Small-3.1-24B-Instruct-2503-image-True] SKIP (https://nvbugs/5459817)

0 commit comments

Comments
 (0)