diff --git a/.buildkite/test-pipeline.yaml b/.buildkite/test-pipeline.yaml index 4edd1cadfb2f0..535f6c612374f 100644 --- a/.buildkite/test-pipeline.yaml +++ b/.buildkite/test-pipeline.yaml @@ -132,7 +132,7 @@ steps: parallelism: 4 - label: LoRA Long Context (Distributed) - #mirror_hardwares: [amd] + mirror_hardwares: [amd] num_gpus: 4 # This test runs llama 13B, so it is required to run on 4 GPUs. commands: diff --git a/Dockerfile.rocm b/Dockerfile.rocm index e30a2aaf30209..49464f6f75953 100644 --- a/Dockerfile.rocm +++ b/Dockerfile.rocm @@ -1,15 +1,15 @@ # default base image -ARG BASE_IMAGE="rocm/pytorch:rocm6.0_ubuntu20.04_py3.9_pytorch_2.1.1" +ARG BASE_IMAGE="rocm/pytorch:rocm6.1_ubuntu20.04_py3.9_pytorch_2.1.2" FROM $BASE_IMAGE -ARG BASE_IMAGE="rocm/pytorch:rocm6.0_ubuntu20.04_py3.9_pytorch_2.1.1" +ARG BASE_IMAGE="rocm/pytorch:rocm6.1_ubuntu20.04_py3.9_pytorch_2.1.2" RUN echo "Base image is $BASE_IMAGE" # BASE_IMAGE for ROCm_5.7: "rocm/pytorch:rocm5.7_ubuntu22.04_py3.10_pytorch_2.0.1" # BASE_IMAGE for ROCm_6.0: "rocm/pytorch:rocm6.0_ubuntu20.04_py3.9_pytorch_2.1.1" - +# BASE_IMAGE for ROCm_6.1: "rocm/pytorch:rocm6.1_ubuntu20.04_py3.9_pytorch_2.1.2" ARG FA_GFX_ARCHS="gfx90a;gfx942" RUN echo "FA_GFX_ARCHS is $FA_GFX_ARCHS" @@ -104,7 +104,6 @@ ENV VLLM_NCCL_SO_PATH=/opt/rocm/lib/librccl.so RUN --mount=type=cache,target=/root/.cache/pip \ pip install -U -r requirements-rocm.txt \ - && patch /opt/rocm/include/hip/amd_detail/amd_hip_bf16.h ./rocm_patch/rocm_bf16.patch \ && python3 setup.py install \ && cp build/lib.linux-x86_64-cpython-39/vllm/_C.cpython-39-x86_64-linux-gnu.so vllm/ \ && cp build/lib.linux-x86_64-cpython-39/vllm/_punica_C.cpython-39-x86_64-linux-gnu.so vllm/ \