Update vLLM-fork version to v0.8.5.post1+Gaudi-1.21.3 #1922

Status: Open · 19 commits · base: main
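
Before building against the new pin, it may be worth confirming the tag is actually published on the fork. A quick sanity check (not part of this PR):

```bash
# Should print exactly one ref if the tag exists upstream.
git ls-remote --tags https://github.com/HabanaAI/vllm-fork.git "v0.8.5.post1+Gaudi-1.21.3"
```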
2 changes: 1 addition & 1 deletion .github/env/_build_image.sh
@@ -3,4 +3,4 @@
# SPDX-License-Identifier: Apache-2.0

export VLLM_VER=v0.10.0
-export VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+export VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
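
These exported variables are consumed by the CI build tooling; a minimal sketch of the intended flow, mirroring the clone-and-checkout steps used by the test scripts below:

```bash
# Sketch, assuming CI sources this env file before cloning the fork.
source .github/env/_build_image.sh
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
git checkout "${VLLM_FORK_VER}"
```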
2 changes: 1 addition & 1 deletion AgentQnA/docker_image_build/build.yaml
@@ -20,7 +20,7 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: agent
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
vllm-rocm:
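
The `dockerfile` path is resolved relative to the `vllm-fork` build context; upstream vLLM moved its Dockerfiles under `docker/` in the v0.8.x line, which is presumably why the path changes alongside the tag bump. With the fork cloned next to the compose file, the image builds the usual compose way (a sketch, assuming this repo layout):

```bash
# Build only the Gaudi vLLM image defined in the compose build file above.
docker compose -f docker_image_build/build.yaml build vllm-gaudi
```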
2 changes: 1 addition & 1 deletion AgentQnA/tests/step1_build_images.sh
@@ -41,7 +41,7 @@ function build_agent_docker_image_gaudi_vllm() {
get_genai_comps

git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build agent image with --no-cache..."
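
The test scripts clone the full fork history and then check out the pinned tag. An equivalent, faster alternative (a sketch, not what the scripts actually do) is a shallow, tag-pinned clone:

```bash
# Shallow-clone only the pinned tag; leaves HEAD detached at the tag.
VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git clone --depth 1 --branch "${VLLM_FORK_VER}" https://github.com/HabanaAI/vllm-fork.git
```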
2 changes: 1 addition & 1 deletion AudioQnA/docker_image_build/build.yaml
@@ -82,7 +82,7 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: audioqna
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
vllm-rocm:
2 changes: 1 addition & 1 deletion AudioQnA/tests/test_compose_on_gaudi.sh
@@ -27,7 +27,7 @@ function build_docker_images() {

git clone https://github.com/HabanaAI/vllm-fork.git
cd vllm-fork/
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
echo "Check out vLLM tag ${VLLM_FORK_VER}"
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

2 changes: 1 addition & 1 deletion ChatQnA/docker_image_build/build.yaml
@@ -123,7 +123,7 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: chatqna
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
nginx:
2 changes: 1 addition & 1 deletion ChatQnA/tests/test_compose_faqgen_on_gaudi.sh
@@ -24,7 +24,7 @@ function build_docker_images() {
docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
popd && sleep 1s
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion ChatQnA/tests/test_compose_guardrails_on_gaudi.sh
@@ -24,7 +24,7 @@ function build_docker_images() {
docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
popd && sleep 1s
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion ChatQnA/tests/test_compose_on_gaudi.sh
@@ -24,7 +24,7 @@ function build_docker_images() {
docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
popd && sleep 1s
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion ChatQnA/tests/test_compose_without_rerank_on_gaudi.sh
@@ -24,7 +24,7 @@ function build_docker_images() {
docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
popd && sleep 1s
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion CodeGen/docker_image_build/build.yaml
@@ -52,7 +52,7 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: codegen
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
dataprep:
2 changes: 1 addition & 1 deletion CodeGen/tests/test_compose_on_gaudi.sh
@@ -27,7 +27,7 @@ function build_docker_images() {

# Download Gaudi vllm of latest tag
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
echo "Check out vLLM tag ${VLLM_FORK_VER}"
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

2 changes: 1 addition & 1 deletion CodeTrans/docker_image_build/build.yaml
@@ -34,7 +34,7 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: codetrans
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
nginx:
2 changes: 1 addition & 1 deletion CodeTrans/tests/test_compose_on_gaudi.sh
@@ -26,7 +26,7 @@ function build_docker_images() {
popd && sleep 1s

git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion DeepResearchAgent/tests/test_compose_on_gaudi.sh
@@ -26,7 +26,7 @@ function build_docker_images() {
docker build --no-cache -t ${REGISTRY}/comps-base:${TAG} --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy -f Dockerfile .
popd && sleep 1s
git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion DocSum/docker_image_build/build.yaml
@@ -63,6 +63,6 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: docsum
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
2 changes: 1 addition & 1 deletion DocSum/tests/test_compose_on_gaudi.sh
@@ -47,7 +47,7 @@ function build_docker_images() {
popd && sleep 1s

git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

echo "Build all the images with --no-cache, check docker_image_build.log for details..."
2 changes: 1 addition & 1 deletion FinanceAgent/docker_compose/intel/hpu/gaudi/README.md
@@ -102,7 +102,7 @@ cd vllm-fork
VLLM_VER=$(git describe --tags "$(git rev-list --tags --max-count=1)")
echo "Check out vLLM tag ${VLLM_VER}"
git checkout ${VLLM_VER}
-docker build --no-cache -f Dockerfile.hpu -t opea/vllm-gaudi:latest --shm-size=128g . --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy
+docker build --no-cache -f docker/Dockerfile.hpu -t opea/vllm-gaudi:latest --shm-size=128g . --build-arg https_proxy=$https_proxy --build-arg http_proxy=$http_proxy
```
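
Note that this README builds whatever the newest fork tag happens to be (`git describe` on the latest tag), while the CI scripts in this PR pin `v0.8.5.post1+Gaudi-1.21.3`. For a build that matches CI exactly, a pinned checkout is an option (a suggestion, not part of this change):

```bash
# Optional: pin the fork tag used by the CI scripts instead of the newest tag.
git checkout v0.8.5.post1+Gaudi-1.21.3
```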

## Validate Services
4 changes: 2 additions & 2 deletions FinanceAgent/tests/test_compose_on_gaudi.sh
@@ -96,9 +96,9 @@ function build_vllm_docker_image() {
fi
cd ./vllm-fork

-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null
-docker build --no-cache -f Dockerfile.hpu -t $VLLM_IMAGE --shm-size=128g . --build-arg https_proxy=$HTTPS_PROXY --build-arg http_proxy=$HTTP_PROXY
+docker build --no-cache -f docker/Dockerfile.hpu -t $VLLM_IMAGE --shm-size=128g . --build-arg https_proxy=$HTTPS_PROXY --build-arg http_proxy=$HTTP_PROXY
if [ $? -ne 0 ]; then
echo "$VLLM_IMAGE failed"
exit 1
2 changes: 1 addition & 1 deletion VisualQnA/docker_image_build/build.yaml
@@ -46,6 +46,6 @@ services:
vllm-gaudi:
build:
context: vllm-fork
-dockerfile: Dockerfile.hpu
+dockerfile: docker/Dockerfile.hpu
extends: visualqna
image: ${REGISTRY:-opea}/vllm-gaudi:${TAG:-latest}
2 changes: 1 addition & 1 deletion VisualQnA/tests/test_compose_on_gaudi.sh
@@ -27,7 +27,7 @@ function build_docker_images() {
popd && sleep 1s

git clone https://github.com/HabanaAI/vllm-fork.git && cd vllm-fork
-VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
+VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3
git checkout ${VLLM_FORK_VER} &> /dev/null && cd ../

service_list="visualqna visualqna-ui lvm nginx vllm-gaudi"
2 changes: 1 addition & 1 deletion one_click_deploy/common/update_images.sh
@@ -123,7 +123,7 @@ get_service_list() {
# Defines the configurations for cloning prerequisite repositories.
# A generic build function will use these settings.

VLLM_FORK_VER="v0.6.6.post1+Gaudi-1.20.0"
VLLM_FORK_VER=v0.8.5.post1+Gaudi-1.21.3

# Config for examples using vLLM v0.8.3
declare -A VLLM_8_3_CONFIG=(
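
The tail of this hunk references per-example config arrays (`VLLM_8_3_CONFIG`), whose body is cut off by the diff. As a purely hypothetical sketch of how such a bash associative-array config might look and be consumed (the key names are illustrative, not taken from the script):

```bash
# Hypothetical keys; the real VLLM_8_3_CONFIG contents are not shown in this hunk.
declare -A EXAMPLE_CONFIG=(
    [repo_url]="https://github.com/HabanaAI/vllm-fork.git"
    [version]="v0.8.5.post1+Gaudi-1.21.3"
)
git clone "${EXAMPLE_CONFIG[repo_url]}" vllm-fork
git -C vllm-fork checkout "${EXAMPLE_CONFIG[version]}"
```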