Skip to content

Commit b43b5e2

Browse files
committed
remove sglang benchmark from triton-benchmarks
1 parent 1bd8840 commit b43b5e2

File tree

2 files changed

+13
-1
lines changed

2 files changed

+13
-1
lines changed

.github/workflows/triton-benchmarks.yml

Lines changed: 12 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -258,6 +258,18 @@ jobs:
258258
python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-triton-report.csv --benchmark attn --compiler triton --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
259259
python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-xetla-report.csv --benchmark attn --compiler xetla --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col XeTLA-TFlops --hbm_col "XeTLA-GB/s" --tag $TAG
260260
261+
- name: Run Triton FA fwd kernel benchmark - advanced path
262+
if: ${{ steps.install.outcome == 'success' && !cancelled() && (inputs.benchmarks == '' || contains(fromJson(inputs.benchmarks || '[]'), 'flash_attention_benchmark.py_advanced')) && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'flash_attention_benchmark.py_advanced') }}
263+
run: |
264+
cd benchmarks/triton_kernels_benchmark
265+
TRITON_INTEL_ADVANCED_PATH=1 \
266+
IGC_VISAOptions=" -enableBCR" \
267+
python flash_attention_benchmark.py --reports $REPORTS --n_runs $N_RUNS
268+
269+
TAG="${TAG}-adv"
270+
source ../../scripts/capture-hw-details.sh
271+
python ../../scripts/build_report.py $REPORTS/attn-performance.csv $REPORTS/attn-triton-advanced-report.csv --benchmark attn --compiler triton --param_cols "Z,H,N_CTX,D_HEAD,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
272+
261273
- name: Run Triton FA bwd kernel benchmark
262274
if: ${{ steps.install.outcome == 'success' && !cancelled() && (inputs.benchmarks == '' || contains(fromJson(inputs.benchmarks || '[]'), 'flash_attention_bwd_benchmark.py')) && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'flash_attention_bwd_benchmark.py') }}
263275
run: |

python/src/ir.cc

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1782,7 +1782,7 @@ void init_triton_ir(py::module &&m) {
17821782
context->disableMultithreading();
17831783
auto printingFlags = OpPrintingFlags();
17841784
printingFlags.elideLargeElementsAttrs(16);
1785-
// printingFlags.enableDebugInfo();
1785+
printingFlags.enableDebugInfo();
17861786
auto printAlways = [funcToDump](Pass *, Operation *op) -> bool {
17871787
if (funcToDump.empty())
17881788
return true;

0 commit comments

Comments
 (0)