@@ -110,35 +110,36 @@ jobs:
110
110
111
111
- name : Install SGLANG
112
112
run : |
113
- SGLANG_PIN="$(<.github/pins/sglang.txt)"
114
- pip install sglang==$SGLANG_PIN
113
+ git clone https://github.com/sgl-project/sglang.git
114
+ cd sglang/python
115
+ pip install .
115
116
116
117
- name : Run SGLANG attention prefill stage benchmark
117
118
if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'prefill_attention_benchmark.py') }}
118
119
run : |
119
120
cd benchmarks/third_party/sglang
120
- python prefill_attention_benchmark --reports $REPORTS
121
+ python prefill_attention_benchmark.py --reports $REPORTS
121
122
122
- source ../../scripts/capture-hw-details.sh
123
- python ../../scripts/build_report.py $REPORTS/prefill-attn-performance.csv $REPORTS/attn-prefill-triton-report.csv --benchmark attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
123
+ source ../../../scripts/capture-hw-details.sh
124
+ python ../../../scripts/build_report.py $REPORTS/prefill-attn-performance.csv $REPORTS/attn-prefill-triton-report.csv --benchmark sglang-prefill-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D,CAUSAL" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
124
125
125
126
- name : Run SGLANG attention decode stage benchmark
126
127
if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'decode_attention_benchmark.py') }}
127
128
run : |
128
129
cd benchmarks/third_party/sglang
129
- python decode_attention_benchmark --reports $REPORTS
130
+ python decode_attention_benchmark.py --reports $REPORTS
130
131
131
- source ../../scripts/capture-hw-details.sh
132
- python ../../scripts/build_report.py $REPORTS/decode-attn-performance.csv $REPORTS/attn-decode-triton-report.csv --benchmark attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
132
+ source ../../../scripts/capture-hw-details.sh
133
+ python ../../../scripts/build_report.py $REPORTS/decode-attn-performance.csv $REPORTS/attn-decode-triton-report.csv --benchmark sglang-decode-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
133
134
134
135
- name : Run SGLANG attention append stage benchmark
135
136
if : ${{ steps.install.outcome == 'success' && !cancelled() && !contains(fromJson(inputs.skip_benchmarks || '[]'), 'decode_attention_benchmark.py') }}
136
137
run : |
137
138
cd benchmarks/third_party/sglang
138
- python extended_attention_benchmark --reports $REPORTS
139
+ python extended_attention_benchmark.py --reports $REPORTS
139
140
140
- source ../../scripts/capture-hw-details.sh
141
- python ../../scripts/build_report.py $REPORTS/extended-attn-performance.csv $REPORTS/attn-append-triton-report.csv --benchmark attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
141
+ source ../../../scripts/capture-hw-details.sh
142
+ python ../../../scripts/build_report.py $REPORTS/extended-attn-performance.csv $REPORTS/attn-append-triton-report.csv --benchmark sglang-extended-attn --compiler triton --param_cols "B,N_CTX,H_Q,H_KV,D" --tflops_col Triton-TFlops --hbm_col "Triton-GB/s" --tag $TAG
142
143
143
144
- name : Upload benchmark reports
144
145
if : ${{ steps.install.outcome == 'success' && !cancelled() }}
0 commit comments