File tree Expand file tree Collapse file tree 2 files changed +4
-2
lines changed
Expand file tree Collapse file tree 2 files changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -186,7 +186,7 @@ jobs:
186186 # Verify installations
187187 echo "$(pwd)/sgl_server_env/bin" >> $GITHUB_PATH
188188
189- - name : Install NVCC
189+ - name : Install NVCC # TODO: Use docker image (nvidia/cuda:12.8.1-devel-ubuntu22.04) instead of locally specifying the variables
190190 if : env.DEVICE_NAME == 'cuda'
191191 shell : bash
192192 run : |
Original file line number Diff line number Diff line change 1+ # TODO: Refactor the workflows to extract the common parts into a reusable GitHub Actions workflow or composite action
12name : vLLM Profiling
23
34on :
1415 description : vLLM commit (optional, default to the latest commit in the branch that has not yet been benchmarked)
1516 required : false
1617 type : string
18+ # TODO: Add support for profiling on a specific model and runner
1719 pull_request :
1820 paths :
1921 - .github/workflows/vllm-profiling.yml
3941 fail-fast : false
4042 matrix :
4143 include :
42- - runs-on : linux.aws.h100.4
44+ - runs-on : linux.aws.a100
4345 device-name : cuda
4446 runs-on : ${{ matrix.runs-on }}
4547 environment : pytorch-x-vllm
You can’t perform that action at this time.
0 commit comments