File tree Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Expand file tree Collapse file tree 2 files changed +7
-1
lines changed Original file line number Diff line number Diff line change @@ -358,8 +358,8 @@ class TestLlama3_1_8BInstruct(LlmapiAccuracyTestHarness):
358358 MODEL_NAME = "meta-llama/Llama-3.1-8B-Instruct"
359359 MODEL_PATH = f"{ llm_models_root ()} /llama-3.1-model/Llama-3.1-8B-Instruct"
360360
361+ @skip_pre_hopper
361362 @pytest .mark .skip_less_device (2 )
362- @pytest .mark .skip_less_device_memory (32000 )
363363 @pytest .mark .parametrize ("disable_overlap_scheduler" , [False , True ])
364364 @pytest .mark .parametrize ("ctx_enable_block_reuse" , [True , False ])
365365 @pytest .mark .parametrize ("gen_enable_block_reuse" , [True , False ])
Original file line number Diff line number Diff line change @@ -389,3 +389,9 @@ unittest/llmapi/test_llm_multi_gpu_pytorch.py::test_llm_rpc_tp2 SKIP (https://nv
389389accuracy/test_llm_api_pytorch.py::TestQwen2_VL_7B::test_auto_dtype SKIP (https://nvbugs/5602338)
390390unittest/llmapi/test_memory_profiling.py SKIP (https://nvbugs/5580781)
391391test_e2e.py::test_ptp_quickstart_multimodal[qwen2.5-vl-7b-instruct-Qwen2.5-VL-7B-Instruct-image-False] SKIP (https://nvbugs/5568825)
392+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[GSM8K-gen_tp=1-ctx_pp=2] SKIP (https://nvbugs/5582277)
393+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[GSM8K-gen_tp=1-ctx_pp=4] SKIP (https://nvbugs/5582277)
394+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[GSM8K-gen_tp=2-ctx_pp=2] SKIP (https://nvbugs/5582277)
395+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[GSM8K-gen_tp=2-ctx_pp=4] SKIP (https://nvbugs/5582277)
396+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[MMLU-gen_tp=2-ctx_pp=2] SKIP (https://nvbugs/5582277)
397+ accuracy/test_disaggregated_serving.py::TestLlama3_1_8BInstruct::test_ctx_pp_gen_tp_asymmetric[MMLU-gen_tp=2-ctx_pp=4] SKIP (https://nvbugs/5582277)
You can’t perform that action at this time.
0 commit comments