Skip to content

Commit 756614a

Browse files
airMeng and leonling-ll
authored and committed
add sglang block fp8 gemm into benchmark
fix bugs rtol atol
1 parent 5a2076d commit 756614a

File tree

2 files changed

+396
-0
lines changed

2 files changed

+396
-0
lines changed

.github/workflows/triton-benchmarks.yml

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -268,6 +268,14 @@ jobs:
268268
source ../../scripts/capture-hw-details.sh
269269
python build_report.py $REPORTS/prefix-sums.csv $REPORTS/prefix_sums-triton-report.csv --benchmark prefix_sums --compiler triton --param_cols "N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
270270
271+
# Runs the SGLang block FP8 GEMM benchmark and builds its Triton report CSV.
# The step executes only when the install step succeeded, the run was not
# cancelled, this benchmark is selected (or no selection was supplied), and
# it is not listed in `skip_benchmarks`. The guard keys on this benchmark's
# own script name, not on `prefix_sums.py`.
- name: Run SGLang FP8 GEMM benchmark
  if: ${{ steps.install.outcome == 'success' && !cancelled() && (inputs.benchmarks == '' || contains(fromJson(inputs.benchmarks || '[]'), 'block_fp8_matmul.py')) && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'block_fp8_matmul.py') }}
  # NOTE(review): the script changes into the `sglang` subdirectory, one level
  # deeper than `triton_kernels_benchmark`, yet still uses `../../scripts/...`;
  # confirm that capture-hw-details.sh and build_report.py resolve from there.
  # NOTE(review): `--param_cols "N"` matches the prefix-sums step; confirm the
  # parameter columns actually written to block_fp8_matmul.csv.
  run: |
    cd benchmarks/triton_kernels_benchmark/sglang
    python block_fp8_matmul.py --reports $REPORTS
    source ../../scripts/capture-hw-details.sh
    python ../../scripts/build_report.py $REPORTS/block_fp8_matmul.csv $REPORTS/block_fp8_matmul-triton-report.csv --benchmark block_fp8_matmul --compiler triton --param_cols "N" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
278+
271279
- name: Run micro benchmark
272280
if: ${{ steps.install.outcome == 'success' && !cancelled() && (inputs.benchmarks == '' || contains(fromJson(inputs.benchmarks || '[]'), 'micro_benchmarks.py')) && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'micro_benchmarks') }}
273281
run: |

0 commit comments

Comments
 (0)