Skip to content

Commit 2df0e9b

Browse files
Rocm vllm ci fix (new design) (#475)
Rocm vllm ci fixing. Signed-off-by: Alexei V. Ivanov <[email protected]> --------- Signed-off-by: Alexei V. Ivanov <[email protected]>
1 parent b758abb commit 2df0e9b

File tree

2 files changed

+11
-3
lines changed

2 files changed

+11
-3
lines changed

.buildkite/run-amd-test.sh

+1-1
Original file line number | Diff line number | Diff line change
@@ -57,7 +57,7 @@ while true; do
5757
done
5858

5959
echo "--- Pulling container"
60-
image_name="rocm/vllm-ci:${BUILDKITE_COMMIT}"
60+
image_name="rocm/vllm-ci-private:${BUILDKITE_COMMIT}"
6161
container_name="rocm_${BUILDKITE_COMMIT}_$(tr -dc A-Za-z0-9 < /dev/urandom | head -c 10; echo)"
6262
docker pull "${image_name}"
6363

.buildkite/test-template.j2

+10-2
Original file line number | Diff line number | Diff line change
@@ -1,13 +1,13 @@
11
{% set docker_image = "public.ecr.aws/q9t5s3a7/vllm-ci-test-repo:$BUILDKITE_COMMIT" %}
2-
{% set docker_image_amd = "rocm/vllm-ci:$BUILDKITE_COMMIT" %}
2+
{% set docker_image_amd = "rocm/vllm-ci-private:$BUILDKITE_COMMIT" %}
33
{% set default_working_dir = "vllm/tests" %}
44
{% set hf_home = "/root/.cache/huggingface" %}
55

66
steps:
77
- label: ":docker: build image"
88
depends_on: ~
99
commands:
10-
- "docker build --build-arg max_jobs=16 --tag {{ docker_image_amd }} -f Dockerfile.rocm --target test --progress plain ."
10+
- "docker build --build-arg max_jobs=16 --tag {{ docker_image_amd }} -f Dockerfile.rocm --build-arg ARG_PYTORCH_ROCM_ARCH='gfx90a;gfx942' --target test --progress plain ."
1111
- "docker push {{ docker_image_amd }}"
1212
key: "amd-build"
1313
env:
@@ -27,7 +27,15 @@ steps:
2727
depends_on:
2828
- "amd-build"
2929
agents:
30+
{% if step.amd_gpus and step.amd_gpus==8%}
3031
queue: amd_gpu
32+
{% elif step.amd_gpus and step.amd_gpus==4%}
33+
queue: amd_gpu
34+
{% elif step.amd_gpus and step.amd_gpus==2%}
35+
queue: amd_gpu
36+
{% else%}
37+
queue: amd_gpu
38+
{% endif%}
3139
commands:
3240
- bash .buildkite/run-amd-test.sh "cd {{ (step.working_dir or default_working_dir) | safe }} ; {{ step.command or (step.commands | join(" && ")) | safe }}"
3341
env:

0 commit comments

Comments
 (0)