@@ -2,7 +2,6 @@ name: vLLM Profiling
22
33on :
44 schedule :
5- # Run every week on Sunday at midnight
65 - cron : ' 0 0 * * 0'
76 workflow_dispatch :
87 inputs :
4039 fail-fast : false
4140 matrix :
4241 include :
43- # TODO: Figure out later if we need to scale this up to multiple runners
4442 - runs-on : linux.aws.h100.4
4543 device-name : cuda
4644 runs-on : ${{ matrix.runs-on }}
6159 fetch-depth : 0
6260
6361 - uses : actions/setup-python@v5
64- # Amazon Linux fails on this step
6562 continue-on-error : true
6663 with :
6764 python-version : ' 3.12'
@@ -118,7 +115,6 @@ jobs:
118115 run : |
119116 set -eux
120117
121- # Mimic the logic from vllm ci-infra test template
122118 if [[ "${HEAD_BRANCH}" == "main" ]]; then
123119 DOCKER_IMAGE_PREFIX=public.ecr.aws/q9t5s3a7/vllm-ci-postmerge-repo
124120 else
@@ -143,11 +139,8 @@ jobs:
143139 set -eux
144140
145141 if [[ -z "${HEAD_SHA}" ]]; then
146- # Looking back the latest 100 commits is enough
147142 for i in {0..99}
148143 do
149- # Check whether the image exists; if it doesn't, fall back to an older
150- # commit, because the image for a very recent commit may not be built yet
151144 HEAD_SHA=$(git rev-parse --verify HEAD~${i})
152145 DOCKER_IMAGE="${DOCKER_IMAGE_PREFIX}:${HEAD_SHA}${DOCKER_IMAGE_SUFFIX}"
153146
@@ -159,8 +152,6 @@ jobs:
159152 fi
160153
161154 echo "HEAD_SHA=$HEAD_SHA" >> $GITHUB_ENV
162-
163- # Print the profiling commit for reference
164155 echo "### Run profiling on [${HEAD_SHA}](https://github.com/vllm-project/vllm/commit/${HEAD_SHA})" >> "${GITHUB_STEP_SUMMARY}"
165156
166157 - name : Setup CUDA GPU_FLAG for docker run
@@ -182,7 +173,6 @@ jobs:
182173 SCCACHE_REGION : us-east-1
183174 HF_TOKEN : ${{ secrets.HF_TOKEN }}
184175 DOCKER_IMAGE : ${{ env.DOCKER_IMAGE_PREFIX }}:${{ env.HEAD_SHA }}${{ env.DOCKER_IMAGE_SUFFIX }}
185- # vLLM-related environment variables
186176 VLLM_USE_MODELSCOPE : false
187177 VLLM_TORCH_PROFILER_DIR : /tmp/workspace/vllm-profiling/profiling-results
188178 CUDA_VISIBLE_DEVICES : 0
@@ -222,7 +212,6 @@ jobs:
222212 )
223213 docker exec -t "${container_name}" bash -c "cd vllm-profiling && bash ../.github/scripts/run_vllm_profiling.sh"
224214
225- # Keep a copy of the profiling results on GitHub for reference
226215 - uses : actions/upload-artifact@v4
227216 with :
228217 name : profiling-results--${{ env.DEVICE_TYPE }}
0 commit comments