@@ -134,7 +134,8 @@ jobs:
134
134
pip install -r .github/scripts/requirements.txt \
135
135
--extra-index-url https://download.pytorch.org/whl/rocm6.3
136
136
else
137
- pip install -r .github/scripts/requirements.txt
137
+ pip install -r .github/scripts/requirements.txt \
138
+ --extra-index-url https://download.pytorch.org/whl/cu128
138
139
fi
139
140
140
141
- name : Set Docker registry
@@ -277,15 +278,9 @@ jobs:
277
278
)
278
279
docker exec -t "${container_name}" bash -c "cd vllm-benchmarks/vllm && bash .buildkite/nightly-benchmarks/scripts/run-performance-benchmarks.sh"
279
280
280
- # Keep a copy of the benchmark results on GitHub for reference
281
- - uses : actions/upload-artifact@v4
282
- with :
283
- name : benchmark-results
284
- path : vllm-benchmarks/vllm/benchmarks/results
285
-
286
281
- name : Authenticate with AWS
287
282
# AWS CUDA runners already have access to the bucket via its runner IAM role
288
- if : env.DEVICE_NAME != 'cuda'
283
+ if : env.DEVICE_NAME == 'rocm' || contains(env.DEVICE_TYPE, 'B200')
289
284
uses : aws-actions/configure-aws-credentials@ececac1a45f3b08a01d2dd070d28d111c5fe6722 # v4.1.0
290
285
with :
291
286
role-to-assume : arn:aws:iam::308535385114:role/gha_workflow_upload-benchmark-results
@@ -304,10 +299,21 @@ jobs:
304
299
ls -lah "${BENCHMARK_RESULTS}"
305
300
306
301
SANITIZED_DEVICE_TYPE=$(echo "${DEVICE_TYPE// /_}" | sed "s/[^[:alnum:].-]/_/g")
302
+ SANITIZED_MODELS="${MODELS//\//_}"
303
+
307
304
python3 .github/scripts/upload_benchmark_results.py \
308
305
--repo vllm-benchmarks/vllm \
309
306
--benchmark-name "vLLM benchmark" \
310
307
--benchmark-results "${BENCHMARK_RESULTS}" \
311
308
--device-name "${DEVICE_NAME}" \
312
309
--device-type "${SANITIZED_DEVICE_TYPE}" \
313
- --model "${MODELS//\//_}"
310
+ --model "${SANITIZED_MODELS}"
311
+
312
+ echo "SANITIZED_DEVICE_TYPE=$SANITIZED_DEVICE_TYPE" >> $GITHUB_ENV
313
+ echo "SANITIZED_MODELS=$SANITIZED_MODELS" >> $GITHUB_ENV
314
+
315
+ # Keep a copy of the benchmark results on GitHub for reference
316
+ - uses : actions/upload-artifact@v4
317
+ with :
318
+ name : benchmark-results--${{ env.SANITIZED_DEVICE_TYPE }}-${{ env.SANITIZED_MODELS }}
319
+ path : vllm-benchmarks/vllm/benchmarks/results
0 commit comments