|
33 | 33 | from defs.conftest import (get_device_count, get_device_memory, |
34 | 34 | get_host_total_memory, get_sm_version, |
35 | 35 | skip_fp8_pre_ada, skip_no_nvls, skip_post_blackwell, |
36 | | - skip_pre_ada, skip_pre_blackwell) |
| 36 | + skip_post_blackwell_ultra, skip_pre_ada, |
| 37 | + skip_pre_blackwell) |
37 | 38 | # yapf: enable |
38 | 39 | from defs.trt_test_alternative import check_call, exists |
39 | 40 |
|
@@ -288,6 +289,7 @@ def test_llm_llama_v1_manage_weights_1gpu_summarize(llama_example_root, |
288 | 289 |
|
289 | 290 |
|
290 | 291 | @skip_pre_blackwell |
| 292 | +@skip_post_blackwell_ultra |
291 | 293 | @pytest.mark.parametrize("data_type", ['bfloat16', 'float16']) |
292 | 294 | @pytest.mark.parametrize("fp4_type", ["plugin", "ootb", "disable"], |
293 | 295 | ids=["fp4_plugin", "fp4_ootb", "disable_fp4"]) |
@@ -2187,6 +2189,7 @@ def test_llm_llama_code_llama_1gpu_summary( |
2187 | 2189 | venv_check_call(llm_venv, summary_cmd) |
2188 | 2190 |
|
2189 | 2191 |
|
| 2192 | +@skip_post_blackwell_ultra |
2190 | 2193 | @pytest.mark.timeout(7200) |
2191 | 2194 | @pytest.mark.skip_less_device_memory(40000) |
2192 | 2195 | @pytest.mark.parametrize("num_beams", [1, 4], |
@@ -3383,6 +3386,7 @@ def test_llm_llama_v3_2_smoothquant_1node_single_gpu( |
3383 | 3386 | @pytest.mark.timeout(7200) |
3384 | 3387 | @pytest.mark.skip_less_device_memory(80000) |
3385 | 3388 | @pytest.mark.skip_less_device(4) |
| 3389 | +@skip_post_blackwell_ultra |
3386 | 3390 | @pytest.mark.parametrize("fp8_quant", |
3387 | 3391 | [pytest.param(True, marks=skip_post_blackwell), False], |
3388 | 3392 | ids=['enable_fp8', 'disable_fp8']) |
|
0 commit comments