diff --git a/.github/workflows/vllm-benchmark.yml b/.github/workflows/vllm-benchmark.yml index 5a818ea..beda40b 100644 --- a/.github/workflows/vllm-benchmark.yml +++ b/.github/workflows/vllm-benchmark.yml @@ -198,6 +198,9 @@ jobs: echo "HEAD_SHA=$HEAD_SHA" >> $GITHUB_ENV + # Print the benchmark commit for reference + echo "### Run benchmark on [${HEAD_SHA}](https://github.com/vllm-project/vllm/commit/${HEAD_SHA})" >> "${GITHUB_STEP_SUMMARY}" + - name: Setup CUDA GPU_FLAG for docker run if: env.DEVICE_NAME == 'cuda' run: | @@ -274,6 +277,12 @@ jobs: ) docker exec -t "${container_name}" bash -c "cd vllm-benchmarks/vllm && bash .buildkite/nightly-benchmarks/scripts/run-performance-benchmarks.sh" + # Keep a copy of the benchmark results on GitHub for reference + - uses: actions/upload-artifact@v4 + with: + name: benchmark-results + path: vllm-benchmarks/vllm/benchmarks/results + - name: Authenticate with AWS # AWS CUDA runners already have access to the bucket via its runner IAM role if: env.DEVICE_NAME != 'cuda'