Skip to content

Commit fb7578a

Browse files
committed
add mtp3 tests.
Signed-off-by: Fanrong Li <23290157+lfr-0531@users.noreply.github.com>
1 parent b3ecd48 commit fb7578a

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2380,7 +2380,7 @@ class TestDeepSeekV32(LlmapiAccuracyTestHarness):
2380 2380
(8, 1, 8, 0, False, True, True, True, 24, "_DEFAULT"),
2381 2381
(8, 1, 8, 1, False, True, True, True, 24, "_DEFAULT"),
2382 2382
(8, 1, 8, 0, True, True, True, True, 24, "_DEFAULT"),
2383-
(8, 1, 8, 1, False, False, True, True, 1, "TRTLLM"),
2383+
(8, 1, 8, 3, False, False, True, True, 1, "TRTLLM"),
2384 2384
],
2385 2385
ids=["baseline", "baseline_mtp1", "baseline_fp8kv", "latency"])
2386 2386
def test_fp8_blockscale(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,
@@ -2448,7 +2448,7 @@ def test_fp8_blockscale(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,
2448 2448
(8, 1, 8, 0, False, True, True, True, 24, "CUTLASS"),
2449 2449
(8, 1, 8, 1, False, True, True, True, 24, "CUTLASS"),
2450 2450
(8, 1, 8, 0, True, True, True, True, 24, "CUTLASS"),
2451-
(8, 1, 8, 1, False, False, True, True, 1, "TRTLLM"),
2451+
(8, 1, 8, 3, False, False, True, True, 1, "TRTLLM"),
2452 2452
],
2453 2453
ids=["baseline", "baseline_mtp1", "baseline_fp8kv", "latency"])
2454 2454
def test_nvfp4_multi_gpus(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,

0 commit comments

Comments
 (0)