Skip to content

Commit 56e97a1

Browse files
committed
add mtp3 tests.
Signed-off-by: Fanrong Li <23290157+lfr-0531@users.noreply.github.com>
1 parent d5b7d43 commit 56e97a1

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

tests/integration/defs/accuracy/test_llm_api_pytorch.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2380,7 +2380,7 @@ class TestDeepSeekV32(LlmapiAccuracyTestHarness):
23802380
(8, 1, 8, 0, False, True, True, True, 24, "_DEFAULT"),
23812381
(8, 1, 8, 1, False, True, True, True, 24, "_DEFAULT"),
23822382
(8, 1, 8, 0, True, True, True, True, 24, "_DEFAULT"),
2383-
(8, 1, 8, 1, False, False, True, True, 1, "TRTLLM"),
2383+
(8, 1, 8, 3, False, False, True, True, 1, "TRTLLM"),
23842384
],
23852385
ids=["baseline", "baseline_mtp1", "baseline_fp8kv", "latency"])
23862386
def test_fp8_blockscale(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,
@@ -2448,7 +2448,7 @@ def test_fp8_blockscale(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,
24482448
(8, 1, 8, 0, False, True, True, True, 24, "CUTLASS"),
24492449
(8, 1, 8, 1, False, True, True, True, 24, "CUTLASS"),
24502450
(8, 1, 8, 0, True, True, True, True, 24, "CUTLASS"),
2451-
(8, 1, 8, 1, False, False, True, True, 1, "TRTLLM"),
2451+
(8, 1, 8, 3, False, False, True, True, 1, "TRTLLM"),
24522452
],
24532453
ids=["baseline", "baseline_mtp1", "baseline_fp8kv", "latency"])
24542454
def test_nvfp4_multi_gpus(self, tp_size, pp_size, ep_size, mtp_nextn, fp8kv,

0 commit comments

Comments (0)