Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions .github/workflows/flash_attention.yml
Original file line number Diff line number Diff line change
Expand Up @@ -19,10 +19,10 @@ jobs:
runs-on: linux.dgx.b200.8
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Checkout Flash Attention repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: Dao-AILab/flash-attention
path: fa4
Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/sglang-benchmark.yml
Original file line number Diff line number Diff line change
Expand Up @@ -38,9 +38,9 @@ jobs:
benchmark_matrix: ${{ steps.set-parameters.outputs.benchmark_matrix }}
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
with:
python-version: '3.12'

Expand Down Expand Up @@ -76,7 +76,7 @@ jobs:
contents: read
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Install system dependencies
shell: bash
Expand All @@ -85,14 +85,14 @@ jobs:
sudo apt-get install -y libnuma-dev numactl

- name: Checkout SGLang repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: sgl-project/sglang
path: sglang-benchmarks/sglang
ref: ${{ inputs.sglang_branch || 'main' }}
fetch-depth: 0

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
# Amazon Linux fails on this step
continue-on-error: true
with:
Expand Down Expand Up @@ -327,7 +327,7 @@ jobs:
echo "SANITIZED_MODELS=$SANITIZED_MODELS" >> $GITHUB_ENV

# Keep a copy of the benchmark results on GitHub for reference
- uses: actions/upload-artifact@v4
- uses: actions/upload-artifact@v6
if: always()
with:
name: sglang-benchmark-results-${{ env.SANITIZED_DEVICE_TYPE }}-${{ env.SANITIZED_MODELS }}
Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/tritonbench.yml
Original file line number Diff line number Diff line change
Expand Up @@ -34,9 +34,9 @@ jobs:
benchmark_matrix: ${{ steps.set-parameters.outputs.benchmark_matrix }}
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
with:
python-version: '3.12'

Expand Down Expand Up @@ -73,7 +73,7 @@ jobs:
contents: read
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Install system dependencies
shell: bash
Expand All @@ -82,14 +82,14 @@ jobs:
sudo apt-get install -y libnuma-dev numactl

- name: Checkout TritonBench repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: meta-pytorch/tritonbench
path: triton-benchmarks/tritonbench
ref: ${{ inputs.tritonbench_branch || 'main' }}
fetch-depth: 0

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
# Amazon Linux fails on this step
continue-on-error: true
with:
Expand Down Expand Up @@ -205,7 +205,7 @@ jobs:
aws-region: us-east-1

# Keep a copy of the benchmark results on GitHub for reference
- uses: actions/upload-artifact@v4
- uses: actions/upload-artifact@v6
if: always()
with:
name: ${{ env.JOB_NAME }}
Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/vllm-benchmark.yml
Original file line number Diff line number Diff line change
Expand Up @@ -45,9 +45,9 @@ jobs:
benchmark_matrix: ${{ steps.set-parameters.outputs.benchmark_matrix }}
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
with:
python-version: '3.12'

Expand Down Expand Up @@ -84,17 +84,17 @@ jobs:
sudo -n chown -R $USER:$USER $GITHUB_WORKSPACE || true

- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Checkout vLLM repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: vllm-project/vllm
path: vllm-benchmarks/vllm
ref: ${{ inputs.vllm_branch || 'main' }}
fetch-depth: 0

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
# Amazon Linux fails on this step
continue-on-error: true
with:
Expand Down Expand Up @@ -381,7 +381,7 @@ jobs:
echo "SANITIZED_MODELS=$SANITIZED_MODELS" >> $GITHUB_ENV

# Keep a copy of the benchmark results on GitHub for reference
- uses: actions/upload-artifact@v4
- uses: actions/upload-artifact@v6
with:
name: benchmark-results--${{ env.SANITIZED_DEVICE_TYPE }}-${{ env.SANITIZED_MODELS }}
path: vllm-benchmarks/vllm/benchmarks/results
4 changes: 2 additions & 2 deletions .github/workflows/vllm-ci-test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -42,10 +42,10 @@ jobs:
environment: pytorch-x-vllm
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Checkout vLLM repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: vllm-project/vllm
path: vllm
Expand Down
12 changes: 6 additions & 6 deletions .github/workflows/vllm-profiling.yml
Original file line number Diff line number Diff line change
Expand Up @@ -29,9 +29,9 @@ jobs:
runs-on: ubuntu-latest
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
with:
python-version: '3.12'
profiling:
Expand All @@ -51,17 +51,17 @@ jobs:
contents: read
steps:
- name: Checkout repository
uses: actions/checkout@v4
uses: actions/checkout@v6

- name: Checkout vLLM repository
uses: actions/checkout@v4
uses: actions/checkout@v6
with:
repository: vllm-project/vllm
path: vllm-profiling/vllm
ref: ${{ inputs.vllm_branch || 'main' }}
fetch-depth: 0

- uses: actions/setup-python@v5
- uses: actions/setup-python@v6
continue-on-error: true
with:
python-version: '3.12'
Expand Down Expand Up @@ -236,7 +236,7 @@ jobs:
path: vllm-profiling/profiling-results
if-no-files-found: warn

- uses: actions/upload-artifact@v4
- uses: actions/upload-artifact@v6
with:
name: profiling-results--${{ env.DEVICE_TYPE }}
path: vllm-profiling/profiling-results