Skip to content

Commit 793c634

Browse files
committed
Add 4th draft of mm_fp4 backend -- enable cross-backend autotune on auto, but no cudnn autotune
1 parent 80f76e0 commit 793c634

File tree

2 files changed

+283
-268
lines changed

2 files changed

+283
-268
lines changed

benchmarks/routines/gemm.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -790,7 +790,7 @@ def testMmFp4(args):
     run_refcheck = args.refcheck
     use_128x4_sf_layout = args.use_128x4_sf_layout
     use_nvfp4 = args.use_nvfp4
-    autotune_supported_backends = ["cutlass", "trtllm", "auto"]
+    autotune_supported_backends = ["cudnn", "cutlass", "trtllm", "auto"]
     res = []
 
     backends = filter_backends_by_compute_capability(backends, args.routine, device)

0 commit comments

Comments
 (0)