From 9cfa9b0928ce2cef30441fdab3c375a54813b2bf Mon Sep 17 00:00:00 2001 From: WangJun Date: Mon, 3 Mar 2025 14:41:02 +0800 Subject: [PATCH 1/4] update bmg24 compute runtime --- docker/llm/serving/xpu/docker/Dockerfile | 59 +++++++++++++++++++++++- 1 file changed, 57 insertions(+), 2 deletions(-) diff --git a/docker/llm/serving/xpu/docker/Dockerfile b/docker/llm/serving/xpu/docker/Dockerfile index e07ab654005..e9ada2f60b5 100644 --- a/docker/llm/serving/xpu/docker/Dockerfile +++ b/docker/llm/serving/xpu/docker/Dockerfile @@ -161,7 +161,62 @@ RUN set -eux && \ VLLM_TARGET_DEVICE=xpu pip install --no-build-isolation -v /llm/vllm && \ pip install mpi4py fastapi uvicorn openai && \ pip install gradio==4.43.0 && \ - pip install ray - + pip install ray && \ + # + # Install compute runtime for BMG 24G + # Install igc + apt-get install bison flex python3-mako && \ + mkdir -p /tmp/igc && \ + cd /tmp/igc && \ + git clone https://github.com/intel/vc-intrinsics vc-intrinsics && \ + git clone -b llvmorg-14.0.5 https://github.com/llvm/llvm-project llvm-project && \ + git clone -b ocl-open-140 https://github.com/intel/opencl-clang llvm-project/llvm/projects/opencl-clang && \ + git clone -b llvm_release_140 https://github.com/KhronosGroup/SPIRV-LLVM-Translator llvm-project/llvm/projects/llvm-spirv && \ + git clone https://github.com/KhronosGroup/SPIRV-Tools.git SPIRV-Tools && \ + git clone https://github.com/KhronosGroup/SPIRV-Headers.git SPIRV-Headers && \ + git clone https://github.com/intel/intel-graphics-compiler igc && \ + git config --global user.email "bigdl@intel.com" &&\ + git config --global user.name "IPEX-LLM" && \ + cd igc && \ + mkdir build && \ + cd build && \ + cmake ../ && \ + make -j32 && \ + make install -j32 && \ + rm -rf /tmp/igc && \ + # + apt-get install libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ + # Install gmmlib + cd /tmp && \ + git clone https://github.com/intel/gmmlib.git && \ + mkdir build && \ + cd build && \ + cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ + make -j32 && \ + make install && \ + cd /tmp && \ + rm -rf /tmp/gmmlib && \ + # Install level-zero + cd /tmp && \ + git clone https://github.com/oneapi-src/level-zero.git && \ + cd level-zero && \ + mkdir build && cd build && \ + cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ + make -j32 && make install && \ + cd /tmp && \ + rm -rf /tmp/level-zero && \ + # Install compute-runtime + wget https://github.com/intel/compute-runtime/archive/refs/tags/24.52.32224.5.zip && \ + unzip 24.52.32224.5.zip && \ + cd compute-runtime-24.52.32224.5 && \ + sed -i '13a \ + DEVICE(0xE210, BmgHwConfig) \ + DEVICE(0xE212, BmgHwConfig) \ + DEVICE(0xE215, BmgHwConfig) \ + DEVICE(0xE216, BmgHwConfig)' ./shared/source/dll/devices/devices_base.inl && \ + sed -i '13s/\(bmgG21DeviceIds{[^}]*\)}/\1, 0xE210, 0xE212, 0xE215, 0xE216}/' ./shared/source/xe2_hpg_core/bmg/definitions/device_ids_configs_bmg.h && \ + mkdir build && cd build && \ + cmake ../ -DSKIP_UNIT_TESTS=ON && \ + make -j32 && make install && \ WORKDIR /llm/ ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"] From 4b6bbc7824308702f7b4cb1ce2e67de985603401 Mon Sep 17 00:00:00 2001 From: WangJun Date: Tue, 4 Mar 2025 02:54:33 +0800 Subject: [PATCH 2/4] update bmg24 compute runtime --- docker/llm/serving/xpu/docker/Dockerfile | 30 ++++++++++-------------- 1 file changed, 13 insertions(+), 17 deletions(-) diff --git a/docker/llm/serving/xpu/docker/Dockerfile b/docker/llm/serving/xpu/docker/Dockerfile index e9ada2f60b5..21409cc96e7 100644 --- a/docker/llm/serving/xpu/docker/Dockerfile +++ b/docker/llm/serving/xpu/docker/Dockerfile @@ -165,7 +165,7 @@ RUN set -eux && \ # # Install compute runtime for BMG 24G # Install igc - apt-get install bison flex python3-mako && \ + apt-get install -y --no-install-recommends bison flex python3-mako && \ mkdir -p /tmp/igc && \ cd /tmp/igc && \ git clone https://github.com/intel/vc-intrinsics vc-intrinsics && \ @@ -178,33 +178,26 @@ RUN set -eux && \ git config --global user.email "bigdl@intel.com" &&\ git config --global user.name "IPEX-LLM" && \ cd igc && \ - mkdir build && \ - cd build && \ + mkdir build && cd build && \ cmake ../ && \ - make -j32 && \ - make install -j32 && \ - rm -rf /tmp/igc && \ + make -j32 && make install -j32 && \ + cd /tmp && rm -rf /tmp/igc && \ # - apt-get install libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ + apt-get install -y --no-install-recommends libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ # Install gmmlib - cd /tmp && \ git clone https://github.com/intel/gmmlib.git && \ - mkdir build && \ - cd build && \ + cd gmmlib && \ + mkdir build && cd build && \ cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ - make -j32 && \ - make install && \ - cd /tmp && \ - rm -rf /tmp/gmmlib && \ + make -j32 && make install && \ + cd /tmp && rm -rf /tmp/gmmlib && \ # Install level-zero - cd /tmp && \ git clone https://github.com/oneapi-src/level-zero.git && \ cd level-zero && \ mkdir build && cd build && \ cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ make -j32 && make install && \ - cd /tmp && \ - rm -rf /tmp/level-zero && \ + cd /tmp && rm -rf /tmp/level-zero && \ # Install compute-runtime wget https://github.com/intel/compute-runtime/archive/refs/tags/24.52.32224.5.zip && \ unzip 24.52.32224.5.zip && \ @@ -218,5 +211,8 @@ RUN set -eux && \ mkdir build && cd build && \ cmake ../ -DSKIP_UNIT_TESTS=ON && \ make -j32 && make install && \ + cd /llm && \ + rm -rf /tmp/compute-runtime-24.52.32224.5 && \ + rm -rf /tmp/24.52.32224.5.zip WORKDIR /llm/ ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"] From c6e13bbc9caf9afd9baffc249dd9ea5a9280ef0a Mon Sep 17 00:00:00 2001 From: WangJun Date: Mon, 3 Mar 2025 14:41:02 +0800 Subject: [PATCH 3/4] update bmg24 compute runtime --- docker/llm/serving/xpu/docker/Dockerfile | 59 +++++++++++++++++++++++- 1 file changed, 57 insertions(+), 2 deletions(-) diff --git a/docker/llm/serving/xpu/docker/Dockerfile b/docker/llm/serving/xpu/docker/Dockerfile index e07ab654005..e9ada2f60b5 100644 --- a/docker/llm/serving/xpu/docker/Dockerfile +++ b/docker/llm/serving/xpu/docker/Dockerfile @@ -161,7 +161,62 @@ RUN set -eux && \ VLLM_TARGET_DEVICE=xpu pip install --no-build-isolation -v /llm/vllm && \ pip install mpi4py fastapi uvicorn openai && \ pip install gradio==4.43.0 && \ - pip install ray - + pip install ray && \ + # + # Install compute runtime for BMG 24G + # Install igc + apt-get install bison flex python3-mako && \ + mkdir -p /tmp/igc && \ + cd /tmp/igc && \ + git clone https://github.com/intel/vc-intrinsics vc-intrinsics && \ + git clone -b llvmorg-14.0.5 https://github.com/llvm/llvm-project llvm-project && \ + git clone -b ocl-open-140 https://github.com/intel/opencl-clang llvm-project/llvm/projects/opencl-clang && \ + git clone -b llvm_release_140 https://github.com/KhronosGroup/SPIRV-LLVM-Translator llvm-project/llvm/projects/llvm-spirv && \ + git clone https://github.com/KhronosGroup/SPIRV-Tools.git SPIRV-Tools && \ + git clone https://github.com/KhronosGroup/SPIRV-Headers.git SPIRV-Headers && \ + git clone https://github.com/intel/intel-graphics-compiler igc && \ + git config --global user.email "bigdl@intel.com" &&\ + git config --global user.name "IPEX-LLM" && \ + cd igc && \ + mkdir build && \ + cd build && \ + cmake ../ && \ + make -j32 && \ + make install -j32 && \ + rm -rf /tmp/igc && \ + # + apt-get install libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ + # Install gmmlib + cd /tmp && \ + git clone https://github.com/intel/gmmlib.git && \ + mkdir build && \ + cd build && \ + cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ + make -j32 && \ + make install && \ + cd /tmp && \ + rm -rf /tmp/gmmlib && \ + # Install level-zero + cd /tmp && \ + git clone https://github.com/oneapi-src/level-zero.git && \ + cd level-zero && \ + mkdir build && cd build && \ + cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ + make -j32 && make install && \ + cd /tmp && \ + rm -rf /tmp/level-zero && \ + # Install compute-runtime + wget https://github.com/intel/compute-runtime/archive/refs/tags/24.52.32224.5.zip && \ + unzip 24.52.32224.5.zip && \ + cd compute-runtime-24.52.32224.5 && \ + sed -i '13a \ + DEVICE(0xE210, BmgHwConfig) \ + DEVICE(0xE212, BmgHwConfig) \ + DEVICE(0xE215, BmgHwConfig) \ + DEVICE(0xE216, BmgHwConfig)' ./shared/source/dll/devices/devices_base.inl && \ + sed -i '13s/\(bmgG21DeviceIds{[^}]*\)}/\1, 0xE210, 0xE212, 0xE215, 0xE216}/' ./shared/source/xe2_hpg_core/bmg/definitions/device_ids_configs_bmg.h && \ + mkdir build && cd build && \ + cmake ../ -DSKIP_UNIT_TESTS=ON && \ + make -j32 && make install && \ WORKDIR /llm/ ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"] From d7aaf243a1263396bc74ac94b01f0ddce9f38507 Mon Sep 17 00:00:00 2001 From: WangJun Date: Tue, 4 Mar 2025 02:54:33 +0800 Subject: [PATCH 4/4] update bmg24 compute runtime --- docker/llm/serving/xpu/docker/Dockerfile | 30 ++++++++++-------------- 1 file changed, 13 insertions(+), 17 deletions(-) diff --git a/docker/llm/serving/xpu/docker/Dockerfile b/docker/llm/serving/xpu/docker/Dockerfile index e9ada2f60b5..21409cc96e7 100644 --- a/docker/llm/serving/xpu/docker/Dockerfile +++ b/docker/llm/serving/xpu/docker/Dockerfile @@ -165,7 +165,7 @@ RUN set -eux && \ # # Install compute runtime for BMG 24G # Install igc - apt-get install bison flex python3-mako && \ + apt-get install -y --no-install-recommends bison flex python3-mako && \ mkdir -p /tmp/igc && \ cd /tmp/igc && \ git clone https://github.com/intel/vc-intrinsics vc-intrinsics && \ @@ -178,33 +178,26 @@ RUN set -eux && \ git config --global user.email "bigdl@intel.com" &&\ git config --global user.name "IPEX-LLM" && \ cd igc && \ - mkdir build && \ - cd build && \ + mkdir build && cd build && \ cmake ../ && \ - make -j32 && \ - make install -j32 && \ - rm -rf /tmp/igc && \ + make -j32 && make install -j32 && \ + cd /tmp && rm -rf /tmp/igc && \ # - apt-get install libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ + apt-get install -y --no-install-recommends libigdgmm-dev libigdgmm12 unzip clinfo pciutils && \ # Install gmmlib - cd /tmp && \ git clone https://github.com/intel/gmmlib.git && \ - mkdir build && \ - cd build && \ + cd gmmlib && \ + mkdir build && cd build && \ cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ - make -j32 && \ - make install && \ - cd /tmp && \ - rm -rf /tmp/gmmlib && \ + make -j32 && make install && \ + cd /tmp && rm -rf /tmp/gmmlib && \ # Install level-zero - cd /tmp && \ git clone https://github.com/oneapi-src/level-zero.git && \ cd level-zero && \ mkdir build && cd build && \ cmake ../ -DCMAKE_INSTALL_PREFIX=/usr && \ make -j32 && make install && \ - cd /tmp && \ - rm -rf /tmp/level-zero && \ + cd /tmp && rm -rf /tmp/level-zero && \ # Install compute-runtime wget https://github.com/intel/compute-runtime/archive/refs/tags/24.52.32224.5.zip && \ unzip 24.52.32224.5.zip && \ @@ -218,5 +211,8 @@ RUN set -eux && \ mkdir build && cd build && \ cmake ../ -DSKIP_UNIT_TESTS=ON && \ make -j32 && make install && \ + cd /llm && \ + rm -rf /tmp/compute-runtime-24.52.32224.5 && \ + rm -rf /tmp/24.52.32224.5.zip WORKDIR /llm/ ENTRYPOINT ["bash", "/llm/start-vllm-service.sh"]