@@ -114,31 +114,31 @@ jobs:
114
114
pip install sglang/python[srt_xpu]
115
115
116
116
# Step: runs prefill_attention_benchmark.py from benchmarks/third_party/sglang, sources
# capture-hw-details.sh, then feeds prefill-attn-performance.csv to build_report.py.
# Runs only when the `install` step succeeded and the run was not cancelled.
# This hunk drops the inputs.skip_benchmarks filter from `if`, points build_report.py at
# ../../triton_kernels_benchmark/, and replaces N_CTX with SEQ_LENS in --param_cols.
- name: Run SGLANG attention prefill stage benchmark
117
- if: ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'prefill_attention_benchmark.py') }}
117
+ if: ${{ steps.install.outcome == 'success' && !cancelled() }}
118
118
run: |
119
119
cd benchmarks/third_party/sglang
120
120
python prefill_attention_benchmark.py --reports $REPORTS
121
121
122
122
source ../../../scripts/capture-hw-details.sh
123
- python ../../../scripts/build_report.py $REPORTS/prefill-attn-performance.csv $REPORTS/attn-prefill-triton-report.csv --benchmark sglang-prefill-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
123
+ python ../../triton_kernels_benchmark/build_report.py $REPORTS/prefill-attn-performance.csv $REPORTS/attn-prefill-triton-report.csv --benchmark sglang-prefill-attn --compiler triton --param_cols "B,SEQ_LENS,H_Q,H_KV,D,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
124
124
125
125
# Step: runs decode_attention_benchmark.py from benchmarks/third_party/sglang, sources
# capture-hw-details.sh, then feeds decode-attn-performance.csv to build_report.py.
# Runs only when the `install` step succeeded and the run was not cancelled.
# This hunk drops the inputs.skip_benchmarks filter from `if`, points build_report.py at
# ../../triton_kernels_benchmark/, and replaces N_CTX with SEQ_LENS in --param_cols.
- name: Run SGLANG attention decode stage benchmark
126
- if: ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'decode_attention_benchmark.py') }}
126
+ if: ${{ steps.install.outcome == 'success' && !cancelled() }}
127
127
run: |
128
128
cd benchmarks/third_party/sglang
129
129
python decode_attention_benchmark.py --reports $REPORTS
130
130
131
131
source ../../../scripts/capture-hw-details.sh
132
- python ../../../scripts/build_report.py $REPORTS/decode-attn-performance.csv $REPORTS/attn-decode-triton-report.csv --benchmark sglang-decode-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
132
+ python ../../triton_kernels_benchmark/build_report.py $REPORTS/decode-attn-performance.csv $REPORTS/attn-decode-triton-report.csv --benchmark sglang-decode-attn --compiler triton --param_cols "B,SEQ_LENS,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
133
133
134
134
# Step: runs extended_attention_benchmark.py from benchmarks/third_party/sglang, sources
# capture-hw-details.sh, then feeds extended-attn-performance.csv to build_report.py.
# Runs only when the `install` step succeeded and the run was not cancelled.
# This hunk drops the inputs.skip_benchmarks filter from `if`, points build_report.py at
# ../../triton_kernels_benchmark/, and replaces N_CTX with SEQ_LENS in --param_cols.
# NOTE(review): the removed `if` tested 'decode_attention_benchmark.py' although this step
# runs extended_attention_benchmark.py; the removed line is kept as recorded.
- name: Run SGLANG attention append stage benchmark
135
- if: ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'decode_attention_benchmark.py') }}
135
+ if: ${{ steps.install.outcome == 'success' && !cancelled() }}
136
136
run: |
137
137
cd benchmarks/third_party/sglang
138
138
python extended_attention_benchmark.py --reports $REPORTS
139
139
140
140
source ../../../scripts/capture-hw-details.sh
141
- python ../../../scripts/build_report.py $REPORTS/extended-attn-performance.csv $REPORTS/attn-append-triton-report.csv --benchmark sglang-extended-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
141
+ python ../../triton_kernels_benchmark/build_report.py $REPORTS/extended-attn-performance.csv $REPORTS/attn-append-triton-report.csv --benchmark sglang-extended-attn --compiler triton --param_cols "B,SEQ_LENS,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
142
142
143
143
- name : Upload benchmark reports
144
144
if : ${{ steps.install.outcome == 'success' && !cancelled() }}
0 commit comments