Skip to content

Commit 2cbbccd

Browse files
committed
update waives
Signed-off-by: Xin He (SW-GPU) <[email protected]>
1 parent 8b21613 commit 2cbbccd

File tree

2 files changed

+16
-7
lines changed

2 files changed

+16
-7
lines changed

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 12 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2697,6 +2697,8 @@ def test_auto_dtype_long_rope(self):
26972697
task.evaluate(llm)
26982698

26992699

2700+
@skip_pre_hopper
2701+
@pytest.mark.skip_less_device_memory(100000)
27002702
class TestGPTOSS(LlmapiAccuracyTestHarness):
27012703
kv_cache_config = KvCacheConfig(free_gpu_memory_fraction=0.5)
27022704
extra_evaluator_kwargs = {
@@ -2708,8 +2710,11 @@ class TestGPTOSS(LlmapiAccuracyTestHarness):
27082710

27092711
MODEL_PATH = f"{llm_models_root()}/gpt_oss/gpt-oss-120b"
27102712

2711-
@pytest.mark.parametrize("moe_backend", ["CUTLASS", "TRTLLM", "TRITON"],
2712-
ids=["cutlass", "trtllm", "triton"])
2713+
@pytest.mark.parametrize(
2714+
"moe_backend",
2715+
["CUTLASS",
2716+
pytest.param("TRTLLM", marks=skip_pre_blackwell), "TRITON"],
2717+
ids=["cutlass", "trtllm", "triton"])
27132718
@pytest.mark.parametrize("cuda_graph,overlap_scheduler", [
27142719
(True, True),
27152720
])
@@ -2737,7 +2742,11 @@ def test_w4_1gpu(self, moe_backend, cuda_graph, overlap_scheduler, mocker):
27372742
extra_evaluator_kwargs=self.extra_evaluator_kwargs)
27382743

27392744
@pytest.mark.skip_less_device(4)
2740-
@pytest.mark.parametrize("moe_backend", ["CUTLASS", "TRTLLM", "TRITON"])
2745+
@pytest.mark.parametrize(
2746+
"moe_backend",
2747+
["CUTLASS",
2748+
pytest.param("TRTLLM", marks=skip_pre_blackwell), "TRITON"],
2749+
ids=["cutlass", "trtllm", "triton"])
27412750
@pytest.mark.parametrize(
27422751
"tp_size,pp_size,ep_size,attention_dp,cuda_graph,overlap_scheduler", [
27432752
(4, 1, 1, False, True, True),

tests/integration/test_lists/waives.txt

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -337,15 +337,15 @@ accuracy/test_cli_flow.py::TestLongAlpaca7B::test_auto_dtype SKIP (https://nvbug
337337
accuracy/test_llm_api.py::TestPhi4MiniInstruct::test_fp8 SKIP (https://nvbugs/5465143)
338338
accuracy/test_llm_api_pytorch.py::TestDeepSeekR1::test_fp8_blockscale[throughput] SKIP (https://nvbugs/5471106)
339339
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_1gpu[True-True-cutlass] SKIP (https://nvbugs/5481080)
340-
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_1gpu[True-True-trtllm] SKIP (https://nvbugs/5481087)
341340
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[tp4-cutlass] SKIP (https://nvbugs/5481080)
342-
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[tp4-TRTLLM] SKIP (https://nvbugs/5481087)
343341
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[ep4-cutlass] SKIP (https://nvbugs/5481080)
344-
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[ep4-TRTLLM] SKIP (https://nvbugs/5481087)
345342
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[dp4-cutlass] SKIP (https://nvbugs/5481080)
346-
accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_4gpus[dp4-TRTLLM] SKIP (https://nvbugs/5481087)
347343
accuracy/test_llm_api_pytorch.py::TestEXAONE4::test_auto_dtype SKIP (https://nvbugs/5481090)
348344
test_e2e.py::test_ptp_quickstart_advanced_8gpus_chunked_prefill_sq_22k[Llama-4-Maverick-17B-128E-Instruct-FP8-llama4-models/nvidia/Llama-4-Maverick-17B-128E-Instruct-FP8-False] SKIP (https://nvbugs/5481094)
349345
test_e2e.py::test_ptp_quickstart_advanced_8gpus_chunked_prefill_sq_22k[Llama-4-Maverick-17B-128E-Instruct-FP8-llama4-models/nvidia/Llama-4-Maverick-17B-128E-Instruct-FP8-True] SKIP (https://nvbugs/5481094)
350346
test_e2e.py::test_ptp_quickstart_advanced_8gpus_chunked_prefill_sq_22k[Llama-4-Scout-17B-16E-Instruct-FP8-llama4-models/Llama-4-Scout-17B-16E-Instruct-FP8-True] SKIP (https://nvbugs/5481094)
351347
test_e2e.py::test_ptp_quickstart_multimodal_2gpu[Phi-4-multimodal-instruct-multimodals/Phi-4-multimodal-instruct] SKIP (https://nvbugs/5480415)
348+
accuracy/test_llm_api_pytorch.py::TestLlama4MaverickInstruct::test_fp8_eagle3[tp8-torch_compile=False] SKIP (https://nvbugs/5483534)
349+
accuracy/test_llm_api_pytorch.py::TestLlama4MaverickInstruct::test_fp8_eagle3[tp8-torch_compile=True] SKIP (https://nvbugs/5483615)
350+
accuracy/test_disaggregated_serving.py::TestQwen3_8B::test_nixl_backend SKIP (https://nvbugs/5448748)
351+
accuracy/test_disaggregated_serving.py::TestDeepSeekV3Lite::test_nixl_backend SKIP (https://nvbugs/5448748)

0 commit comments

Comments
 (0)